{"payload":{"pageCount":1,"repositories":[{"type":"Public","name":"velox","owner":"oap-project","isFork":true,"description":"A new C++ vectorized database acceleration library aimed to optimizing query engines and data processing systems.","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":20,"issueCount":8,"starsCount":17,"forksCount":1076,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-28T01:10:06.886Z"}},{"type":"Public","name":"raydp","owner":"oap-project","isFork":false,"description":"RayDP provides simple APIs for running Spark on Ray and integrating Spark with AI libraries.","allTopics":["ray","spark"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":10,"issueCount":32,"starsCount":293,"forksCount":66,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-26T07:25:46.025Z"}},{"type":"Public","name":"libhdfs3","owner":"oap-project","isFork":true,"description":"HDFS file read access for ClickHouse","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":1,"issueCount":0,"starsCount":2,"forksCount":53,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-25T07:08:59.399Z"}},{"type":"Public","name":"text2sql-gluten","owner":"oap-project","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":5,"forksCount":3,"license":null,"participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,5,1,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-15T08:09:35.183Z"}},{"type":"Public","name":"pyspark-ai","owner":"oap-project","isFork":true,"description":"English SDK for Apache Spark","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":120,"license":"Apache License 2.0","participation":[9,3,2,7,2,10,5,2,1,2,2,4,10,13,4,8,2,9,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,1,1,1,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-08T05:06:55.750Z"}},{"type":"Public archive","name":"oap-tools","owner":"oap-project","isFork":false,"description":"Tools for building, packaging, and OAP public cloud integrations such as AWS EMR, Google Dataproc and K8S. ","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":2,"issueCount":9,"starsCount":16,"forksCount":13,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-27T06:14:30.626Z"}},{"type":"Public","name":"spark-ai-kit","owner":"oap-project","isFork":true,"description":"Gluten: Plugin to Double SparkSQL's Performance","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":376,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-26T02:54:23.592Z"}},{"type":"Public","name":"oap-mllib","owner":"oap-project","isFork":false,"description":"Optimized Spark package to accelerate machine learning algorithms in Apache Spark MLlib.","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":5,"issueCount":34,"starsCount":20,"forksCount":12,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-26T02:22:59.226Z"}},{"type":"Public","name":"remote-shuffle","owner":"oap-project","isFork":false,"description":" Spark* shuffle plugin for support shuffling data through a remote Hadoop-compatible file system, as opposed to vanilla Spark's local-disks.","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":1,"issueCount":4,"starsCount":19,"forksCount":12,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-15T07:30:56.927Z"}},{"type":"Public","name":"protobuf","owner":"oap-project","isFork":true,"description":"A Intel customized Protocol Buffers - Google's data interchange format","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":1,"issueCount":0,"starsCount":0,"forksCount":15344,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-21T12:59:54.343Z"}},{"type":"Public archive","name":"Gluten-Trino","owner":"oap-project","isFork":false,"description":"Gluten: Plugin to Boost Trino's Performance","allTopics":[],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":1,"issueCount":6,"starsCount":67,"forksCount":13,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-25T02:09:49.220Z"}},{"type":"Public archive","name":"cloudtik","owner":"oap-project","isFork":false,"description":"Cloud Scale Platform for Distributed Analytics and AI","allTopics":["machine-learning","cloud","ai","spark","deep-learning","analytics","alibabacloud","kubernetes","aws","azure","gcp"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":1,"starsCount":23,"forksCount":7,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-10-12T15:34:17.499Z"}},{"type":"Public archive","name":"pmem-shuffle","owner":"oap-project","isFork":false,"description":"Spark* Shuffle plugin for support shuffling through remote persistent memory over fabrics, which leverages the RDMA network and remote persistent memory (for read) to provide extremely high performance and low latency shuffle solutions for Spark*.","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":1,"issueCount":15,"starsCount":14,"forksCount":9,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-18T20:04:11.109Z"}},{"type":"Public archive","name":"recdp","owner":"oap-project","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":2,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-18T19:28:23.556Z"}},{"type":"Public archive","name":"oap-project.github.io","owner":"oap-project","isFork":false,"description":"The OAP project web site","allTopics":[],"primaryLanguage":{"name":"HTML","color":"#e34c26"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-09-05T05:04:03.632Z"}},{"type":"Public","name":"arrow","owner":"oap-project","isFork":true,"description":"Apache Arrow is a cross-language development platform for in-memory data. It specifies a standardized language-independent columnar memory format for flat and hierarchical data, organized for efficient analytic operations on modern hardware. It also provides computational libraries and zero-copy streaming messaging and interprocess communication…","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":21,"issueCount":0,"starsCount":6,"forksCount":3373,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-05-18T08:25:34.673Z"}},{"type":"Public archive","name":"gazelle_plugin","owner":"oap-project","isFork":false,"description":"Native SQL Engine plugin for Spark SQL with vectorized SIMD optimizations.","allTopics":["spark","arrow","native-sql-engine","vectorized-simd-optimizations","native-kernels"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":24,"issueCount":191,"starsCount":256,"forksCount":77,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-02-21T07:48:24.508Z"}},{"type":"Public archive","name":"solution-navigator","owner":"oap-project","isFork":false,"description":"Example solutions or code for using OAP features.","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":3,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-25T20:11:59.848Z"}},{"type":"Public archive","name":"sql-ds-cache","owner":"oap-project","isFork":false,"description":"Spark* plug-in for accelerating Spark* SQL performance by using cache and index at SQL data source layer.","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":4,"issueCount":15,"starsCount":37,"forksCount":25,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-03T22:55:10.332Z"}},{"type":"Public archive","name":"libhdfs3-downstream","owner":"oap-project","isFork":true,"description":"a native c/c++ hdfs client (downstream fork from apache-hawq)","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":54,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-03T22:55:08.506Z"}},{"type":"Public archive","name":"arrow-data-source","owner":"oap-project","isFork":false,"description":"Spark DataSouce plugin for reading files from various formats like Parquet into Arrow compatible columnar vectors.","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":0,"issueCount":3,"starsCount":6,"forksCount":11,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-01-03T22:55:06.730Z"}},{"type":"Public archive","name":"pmem-spill","owner":"oap-project","isFork":false,"description":"Spark plug-in package for accelerating Spark runtime spill functions using PMem such as RDD cache PMem extension.","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":1,"issueCount":11,"starsCount":7,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-12-15T01:56:29.075Z"}},{"type":"Public archive","name":"pmem-common","owner":"oap-project","isFork":false,"description":"Common library for accessing PMEM native library functions including memkind, vmemcache and so on.","allTopics":[],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":1,"issueCount":3,"starsCount":3,"forksCount":7,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2021-12-14T05:35:52.222Z"}}],"repositoryCount":23,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}