About: Apache Spark

Property	Value
dbo:author	dbr:Matei_Zaharia
dbo:description	framework van Apache Software Foundation (nl) plataforma de análisis de datos de forma distribuida (es) オープンソースのデータ分析クラスタ・コンピューティングフレームワーク (ja) фреймворк распределённой обработки данных, входит в экосистему Hadoop (ru) framework de traitement et de calcul distribué (fr) framework open source per il calcolo distribuito (it) open-source softvér na analýzu dát (sk) ανοιχτού κώδικα που υποστηρίζει την κατανεμημένη επεξεργασία μεγάλου όγκου δεδομένων (el) open-source data analytics cluster computing framework (en) quelloffenes Datenanalyse- und Cluster-Computing-Framework (de) plataforma d'anàlisi de dades de forma distribuïda (ca)
dbo:genre	dbr:Machine_learning
dbo:language	dbr:Java_(programming_language) dbr:C_Sharp_(programming_language) dbr:F_Sharp_(programming_language) dbr:Python_(programming_language) dbr:Scala_(programming_language) dbr:R_(programming_language) dbr:SQL
dbo:latestReleaseDate	2025-05-23 (xsd:date)
dbo:latestReleaseVersion	4.0.0 (Scala2.13)
dbo:license	dbr:Apache_License
dbo:operatingSystem	dbr:Linux dbr:Microsoft_Windows dbr:MacOS
dbo:programmingLanguage	dbr:Scala_(programming_language)
dbo:thumbnail	wiki-commons:Special:FilePath/Apache_Spark_logo.svg?width=300
dbo:wikiPageExternalLink	https://gitbox.apache.org/repos/asf%3Fp https://github.com/apache/spark/releases/tag/v1.0.0
dbo:wikiPageWikiLink	dbr:Filter_(computer_science) dbr:Latent_Dirichlet_allocation dbr:Fold_(higher-order_function) dbr:MapR dbr:Pipeline_(software) dbr:Codebase dbr:Kubernetes dbr:Java_(programming_language) dbr:Linux dbr:Microsoft_Windows dbr:Twitter dbr:Apache_Kafka dbr:.NET dbr:Amazon_Web_Services dbr:Apache_License dbr:BSD_licenses dbr:C_Sharp_(programming_language) dbr:Cloud_computing dbr:Collaborative_filtering dbr:Database dbr:F_Sharp_(programming_language) dbr:MacOS dbr:Machine_learning dbr:Principal_component_analysis dbr:Python_(programming_language) dbr:Scala_(programming_language) dbr:R_(programming_language) dbr:Data_center dbr:OpenStack dbr:Vowpal_Wabbit dbc:Java_platform dbc:Apache_Software_Foundation_projects dbr:Distributed_computing dbr:Julia_(programming_language) dbr:Open-source_software dbr:Apache_Hadoop dbr:Clustered_file_system dbr:Working_set dbr:Immutable_object dbr:On-premises_software dbr:Random_forest dbr:Dataflow dbr:Anonymous_function dbr:MapReduce dbr:Latency_(engineering) dbr:Big_data dbr:Java_Database_Connectivity dbr:Imperative_programming dbr:Naive_Bayes_classifier dbr:Graph_(abstract_data_type) dbr:Network_socket dbr:Databricks dbr:Map_(parallel_pattern) dbr:File:Apache_Spark_logo.svg dbr:SQL dbr:Data_parallelism dbr:Fault_tolerance dbr:Apache_Mahout dbr:Alluxio dbr:Apache_Mesos dbr:Apache_Flink dbr:Apache_Kudu dbr:Functional_programming dbr:PageRank dbr:Abstraction_(computer_science) dbr:Regression_analysis dbr:Decision_tree dbr:Logistic_regression dbr:Matei_Zaharia dbr:ZeroMQ dbr:Lambda_architecture dbr:Statistical_classification dbr:Set_(abstract_data_type) dbr:Shared_memory dbr:Directed_acyclic_graph dbr:Data_transformation_(statistics) dbr:Graph_database dbr:Command-line_interface dbr:Programming_paradigm dbr:Dimensionality_reduction dbr:Event_stream_processing dbr:Open_Database_Connectivity dbr:Semi-structured_data dbr:Lazy_evaluation dbr:Gradient_boosting dbr:Apache_Cassandra dbr:Cluster_analysis dbr:Lustre_(file_system) dbr:Domain-specific_language dbr:Linear_regression dbr:K-means_clustering dbr:Singular_value_decomposition dbr:Amazon_S3 dbr:Stratified_sampling dbr:Stochastic_gradient_descent dbr:Feature_extraction dbr:Summary_statistics dbr:List_of_concurrent_and_parallel_programming_languages dbr:Higher-order_programming dbc:Hadoop dbr:Limited-memory_BFGS dbc:Data_mining_and_machine_learning_software dbr:AMPLab dbc:Articles_with_example_Scala_code dbc:Cluster_computing dbc:Free_software_programmed_in_Scala dbc:University_of_California,_Berkeley dbc:Big_data_products dbr:Cluster_manager dbc:Software_using_the_Apache_license dbr:Deprecated dbr:Correlation_and_dependence dbr:Apache_Flume dbr:Apache_License_2.0 dbr:Apache_Software_Foundation dbr:Application_programming_interface dbr:Support_vector_machines dbr:UC_Berkeley dbr:Optimization_(mathematics) dbr:Storm_(event_processor) dbr:Hypothesis_testing dbr:I/O_interface dbr:Fault-tolerant_computing dbr:CPU_core dbr:Iterative_algorithm dbr:Join_(database) dbr:Scale_(computing)
dbp:author	dbr:Matei_Zaharia
dbp:developer	Apache Spark (en)
dbp:genre	Data analytics, machine learning algorithms (en)
dbp:language	dbr:Java_(programming_language) dbr:C_Sharp_(programming_language) dbr:F_Sharp_(programming_language) dbr:Python_(programming_language) dbr:Scala_(programming_language) dbr:R_(programming_language) dbr:SQL
dbp:latestReleaseDate	2025-05-23 (xsd:date)
dbp:latestReleaseVersion	4 (xsd:integer)
dbp:license	dbr:Apache_License
dbp:logo	dbr:File:Apache_Spark_logo.svg
dbp:name	Apache Spark (en)
dbp:operatingSystem	dbr:Linux dbr:Microsoft_Windows dbr:MacOS
dbp:programmingLanguage	dbr:Scala_(programming_language)
dbp:released	https://github.com/apache/spark/releases/tag/v1.0.0
dbp:repo	https://gitbox.apache.org/repos/asf%3Fp
dbp:wikiPageUsesTemplate	dbt:Apache_Software_Foundation dbt:Efn dbt:Infobox_software dbt:Mono dbt:Notelist dbt:Official_URL dbt:Official_website dbt:R dbt:Reflist dbt:Short_description dbt:Start_date_and_age dbt:Version dbt:Parallel_computing
dct:subject	dbc:Java_platform dbc:Apache_Software_Foundation_projects dbc:Hadoop dbc:Data_mining_and_machine_learning_software dbc:Articles_with_example_Scala_code dbc:Cluster_computing dbc:Free_software_programmed_in_Scala dbc:University_of_California,_Berkeley dbc:Big_data_products dbc:Open_source_projects dbc:Software_using_the_Apache_license
gold:hypernym	dbr:Framework
rdf:type	owl:Thing dbo:Software dbo:Software dbo:Software wikidata:Q386724 wikidata:Q7397 dbo:Work dbo:Work schema:CreativeWork
rdfs:label	Apache Spark (en) Apache Spark (ca) Apache Spark (de) Apache Spark (es) Apache Spark (fr) Apache Spark (it) 아파치 스파크 (ko) Apache Spark (ja) Apache Spark (pt) Apache Spark (pl) Apache Spark (uk) Apache Spark (ru) Apache Spark (zh)
owl:sameAs	freebase:Apache Spark yago-res:Apache Spark wikidata:Apache Spark dbpedia-de:Apache Spark dbpedia-es:Apache Spark dbpedia-it:Apache Spark dbpedia-pl:Apache Spark dbpedia-fr:Apache Spark dbpedia-he:Apache Spark dbpedia-ja:Apache Spark dbpedia-pt:Apache Spark dbpedia-ru:Apache Spark dbpedia-zh:Apache Spark dbpedia-ko:Apache Spark dbpedia-ca:Apache Spark dbpedia-fa:Apache Spark dbpedia-fi:Apache Spark dbpedia-uk:Apache Spark dbpedia-global:Apache Spark
prov:wasDerivedFrom	wikipedia-en:Apache_Spark?oldid=1305355033&ns=0
foaf:depiction	wiki-commons:Special:FilePath/Apache_Spark_logo.svg
foaf:isPrimaryTopicOf	wikipedia-en:Apache_Spark
foaf:name	Apache Spark (en)
is dbo:knownFor of	dbr:Holden_Karau dbr:Ion_Stoica dbr:Reynold_Xin dbr:Matei_Zaharia dbr:Ali_Ghodsi
is dbo:wikiPageDisambiguates of	dbr:Spark
is dbo:wikiPageRedirects of	dbr:PySpark dbr:GraphX dbr:Apache_spark dbr:Org.apache.spark dbr:Resilient_Distributed_Dataset dbr:Resilient_Distributed_Datasets dbr:Resilient_distributed_dataset dbr:Spark_(cluster_computing_framework)
is dbo:wikiPageWikiLink of	dbr:GenevaERS dbr:List_of_Apache_Software_Foundation_projects dbr:Google_Cloud_Platform dbr:KNIME dbr:Latent_Dirichlet_allocation dbr:Apache_Pig dbr:Dataflow_programming dbr:MapR dbr:Holden_Karau dbr:Elastic_net_regularization dbr:Convolutional_neural_network dbr:List_of_University_of_Waterloo_people dbr:Reverse_image_search dbr:Paxata dbr:Jean_Georges_Perrin dbr:University_of_Waterloo dbr:Tim_Howes dbr:Apache_Kafka dbr:Stream_processing dbr:Machine_learning dbr:Scala_(programming_language) dbr:R_(programming_language) dbr:Recurrent_neural_network dbr:Oracle_Cloud dbr:Apache_Hadoop dbr:Time_series dbr:C._Mohan dbr:Ion_Stoica dbr:Reynold_Xin dbr:Big_data dbr:BMC_Software dbr:Hortonworks dbr:Aiyara_cluster dbr:Databricks dbr:Data_lake dbr:Programming_model dbr:Graph_Query_Language dbr:Open_source dbr:Biostatistics dbr:Kernel_density_estimation dbr:Reza_Zadeh dbr:RDD dbr:Apache_Hive dbr:Apache_Mahout dbr:Apache_ZooKeeper dbr:Alluxio dbr:Apache_Mesos dbr:Data_Analytics_Library dbr:Apache_ORC dbr:Apache_Arrow dbr:Apache_CarbonData dbr:Apache_Parquet dbr:Apache_RocketMQ dbr:MinIO dbr:Isolation_forest dbr:Spark_NLP dbr:GeoTrellis dbr:Open_coopetition dbr:Merge_(SQL) dbr:Message_Passing_Interface dbr:PageRank dbr:Spatial_database dbr:Vertica dbr:Alibaba_Cloud dbr:Logistic_regression dbr:Spark dbr:Data_engineering dbr:Spectral_clustering dbr:HPCC dbr:Michael_J._Franklin dbr:Haoyuan_Li dbr:Matei_Zaharia dbr:Sematext dbr:Apache_Samza dbr:Deeplearning4j dbr:Lambda_architecture dbr:PickMe dbr:RevoScaleR dbr:Revoscalepy dbr:Jin_Li_(computer_scientist) dbr:Apache_Iceberg dbr:Autoregressive_integrated_moving_average dbr:List_of_sequence_alignment_software dbr:Graph_database dbr:Ali_Ghodsi dbr:Materialized_view dbr:Bzip2 dbr:International_Collegiate_Programming_Contest dbr:Cascading_(software) dbr:Gremlin_(query_language) dbr:SingleStore dbr:JanusGraph dbr:Apache_Avro dbr:Solution_stack dbr:Hypergraph dbr:Big_Data_Partnership dbr:Pipeline_(computing) dbr:K-means_clustering dbr:Notebook_interface dbr:Biomedical_text_mining dbr:Fuzzy_concept dbr:Apache_Storm dbr:Apache_SystemDS dbr:XGBoost dbr:JKool dbr:Apache_Beam dbr:Caffe_(software) dbr:Feature_hashing dbr:List_of_concurrent_and_parallel_programming_languages dbr:Outline_of_machine_learning dbr:List_of_programmers dbr:AMPLab dbr:Link_prediction dbr:Cray_Urika-XA dbr:List_of_big_data_companies dbr:List_of_Romanian_Americans dbr:Frequent_pattern_discovery dbr:List_of_commercial_open-source_applications_and_services dbr:List_of_Java_frameworks dbr:IBM_Watson_Studio dbr:Dataframe dbr:MapR_FS dbr:PySpark dbr:GraphX dbr:Matroid_(company) dbr:Apache_spark dbr:Org.apache.spark dbr:Resilient_Distributed_Dataset dbr:Resilient_Distributed_Datasets dbr:Resilient_distributed_dataset dbr:Spark_(cluster_computing_framework)
is dbp:knownFor of	dbr:Holden_Karau dbr:Ion_Stoica dbr:Reynold_Xin dbr:Matei_Zaharia
is foaf:primaryTopic of	wikipedia-en:Apache_Spark