{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"mosaic","owner":"databrickslabs","isFork":false,"description":"An extension to the Apache Spark framework that allows easy and fast processing of very large geospatial datasets.","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":11,"issueCount":57,"starsCount":256,"forksCount":61,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-09T22:49:40.989Z"}},{"type":"Public","name":"ucx","owner":"databrickslabs","isFork":false,"description":"Your best companion for upgrading to Unity Catalog. UCX will guide you, the Databricks customer, through the process of upgrading your account, groups, workspaces, jobs etc. to Unity Catalog.","allTopics":["databricks","unity-catalog","databricks-cli-installable"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":108,"starsCount":172,"forksCount":64,"license":"Other","participation":[2,1,2,0,19,1,8,9,7,3,7,16,31,14,36,18,30,28,10,12,4,5,15,10,14,6,17,18,8,7,9,19,13,10,11,15,18,12,36,21,22,45,33,28,42,37,31,42,10,33,31,25],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-09T17:23:06.114Z"}},{"type":"Public","name":"remorph","owner":"databrickslabs","isFork":false,"description":"Cross-compiler and Data Reconciler into Databricks Lakehouse","allTopics":["reconciliation","data-validation","transpiler","databricks"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":8,"issueCount":109,"starsCount":16,"forksCount":10,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,1,1,0,0,0,0,1,0,0,0,4,10,8,8,6,4,7,9,5,7,5,7,10,11,12,20,10,19,9,22,17,21],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-09T05:11:27.661Z"}},{"type":"Public","name":"dbldatagen","owner":"databrickslabs","isFork":false,"description":"Generate relevant synthetic data quickly for your projects. The Databricks Labs synthetic data generator (aka `dbldatagen`) may be used to generate large simulated / synthetic data sets for test, POCs, and other uses in Databricks environments including in Delta Live Tables pipelines","allTopics":["spark","faker","pyspark","spark-streaming","data-generation","databricks","synthetic-data","datagen","datagenerator","deltalake","datageneration","delta-live-tables","python"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":11,"issueCount":13,"starsCount":278,"forksCount":55,"license":"Other","participation":[1,0,1,1,2,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,0,0,3,2,5],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-08T03:47:16.093Z"}},{"type":"Public","name":"overwatch","owner":"databrickslabs","isFork":false,"description":"Capture deep metrics on one or all assets within a Databricks workspace","allTopics":["monitoring","databricks"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":15,"issueCount":136,"starsCount":219,"forksCount":59,"license":"Other","participation":[2,6,0,0,0,0,0,5,1,0,0,0,0,1,0,0,1,0,0,0,1,0,2,4,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-07T13:46:56.142Z"}},{"type":"Public","name":"dbignite","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":22,"forksCount":10,"license":"Other","participation":[4,35,9,8,38,3,6,5,0,0,0,0,1,0,11,0,0,9,1,0,1,6,0,0,1,0,30,0,5,10,18,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,5,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-06T15:07:21.749Z"}},{"type":"Public","name":"sandbox","owner":"databrickslabs","isFork":false,"description":"Experimental or low-maturity things","allTopics":["databricks","databricks-api","databricks-sdk"],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":18,"issueCount":6,"starsCount":16,"forksCount":4,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,5,0,0,15,2,1,7,0,8,12,3,7,2,9,16,20,4,10,1,3,11,7,8,1,0,0,0,0,2,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-05T15:14:22.691Z"}},{"type":"Public","name":"tempo","owner":"databrickslabs","isFork":false,"description":"API for manipulating time series on top of Apache Spark: lagged time values, rolling statistics (mean, avg, sum, count, etc), AS OF joins, downsampling, and interpolation","allTopics":["python","scala","timeseries-data","timeseries-analysis","data-science","timeseries","time-series","pandas","data-analysis"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":11,"issueCount":33,"starsCount":301,"forksCount":50,"license":"Other","participation":[0,0,0,0,0,2,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,1,0,0,0,0,3,0,0,0,0,0,0,2,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-04T01:33:59.171Z"}},{"type":"Public","name":"dlt-meta","owner":"databrickslabs","isFork":false,"description":"This is metadata driven DLT based framework for bronze/silver pipelines","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":15,"starsCount":123,"forksCount":53,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-03T18:18:32.612Z"}},{"type":"Public","name":"lsql","owner":"databrickslabs","isFork":false,"description":"Lightweight SQL execution wrapper only on top of Databricks SDK","allTopics":["databricks","databricks-sql","databricks-sdk"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":19,"starsCount":3,"forksCount":1,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,2,0,1,0,0,0,0,0,0,0,1,0,0,0,1,1,2,1,1,0,0,2,15,5,10,7,4,2,1,0,2,0,5,2,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T10:30:03.278Z"}},{"type":"Public","name":"blueprint","owner":"databrickslabs","isFork":false,"description":"Baseline for Databricks Labs projects written in Python ","allTopics":["python","cli","databricks","databricks-cli-installable"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":11,"forksCount":6,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-30T20:21:53.064Z"}},{"type":"Public","name":"dataframe-rules-engine","owner":"databrickslabs","isFork":false,"description":"Extensible Rules Engine for custom Dataframe / Dataset validation","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":4,"issueCount":8,"starsCount":133,"forksCount":30,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-07T21:04:37.881Z"}},{"type":"Public","name":"splunk-integration","owner":"databrickslabs","isFork":false,"description":"Databricks Add-on for Splunk","allTopics":["cybersecurity","databricks","databricks-notebooks","splunk-addon"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":15,"starsCount":26,"forksCount":17,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-07T10:27:01.996Z"}},{"type":"Public","name":"pylint-plugin","owner":"databrickslabs","isFork":false,"description":"Databricks Plugin for PyLint","allTopics":["python","databricks","pylint-plugin"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":11,"starsCount":7,"forksCount":2,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T12:01:18.287Z"}},{"type":"Public","name":"databricks-sdk-r","owner":"databrickslabs","isFork":false,"description":"Databricks SDK for R (Experimental)","allTopics":["data-science","r","sdk","databricks"],"primaryLanguage":{"name":"R","color":"#198CE7"},"pullRequestCount":1,"issueCount":6,"starsCount":20,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-08T10:28:16.311Z"}},{"type":"Public","name":"tika-ocr","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Rich Text Format","color":"#ccc"},"pullRequestCount":4,"issueCount":2,"starsCount":17,"forksCount":2,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-03T20:25:20.972Z"}},{"type":"Public","name":"discoverx","owner":"databrickslabs","isFork":false,"description":"A Swiss-Army-knife for your Data Intelligence platform administration.","allTopics":["scanning","data-retrieval","pii-detection","semantic-classification","multi-table-operations"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":10,"issueCount":7,"starsCount":98,"forksCount":9,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-27T11:23:04.648Z"}},{"type":"Public","name":"delta-sharing-java-connector","owner":"databrickslabs","isFork":false,"description":"A Java connector for delta.io/sharing/ that allows you to easily ingest data on any JVM.","allTopics":["java","delta-sharing"],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":2,"issueCount":2,"starsCount":12,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-25T18:59:46.547Z"}},{"type":"Public","name":"transpiler","owner":"databrickslabs","isFork":false,"description":"SIEM-to-Spark Transpiler","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":5,"issueCount":13,"starsCount":40,"forksCount":5,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-18T20:31:06.843Z"}},{"type":"Public","name":"smolder","owner":"databrickslabs","isFork":false,"description":"HL7 Apache Spark Datasource","allTopics":["spark","hl7","datasource","hl7v2"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":0,"issueCount":1,"starsCount":57,"forksCount":20,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-15T17:53:23.893Z"}},{"type":"Public","name":"dbx","owner":"databrickslabs","isFork":false,"description":"🧱 Databricks CLI eXtensions - aka dbx is a CLI tool for development and advanced Databricks workflows management.","allTopics":["ci","cicd","databricks","mlops","databricks-cli","databricks-api"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":12,"issueCount":91,"starsCount":435,"forksCount":120,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-26T13:26:25.713Z"}},{"type":"Public","name":"doc-qa","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":0,"starsCount":41,"forksCount":5,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-23T06:55:32.059Z"}},{"type":"Public","name":"databricks-sync","owner":"databrickslabs","isFork":false,"description":"An experimental tool to synchronize source Databricks deployment with a target Databricks deployment.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":16,"starsCount":46,"forksCount":12,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-21T19:34:04.619Z"}},{"type":"Public","name":"arcuate","owner":"databrickslabs","isFork":false,"description":"Delta Sharing + MLflow for ML model & experiment exchange (arcuate delta - a fan shaped river delta)","allTopics":["big-data","spark","data-sharing","mlflow","delta-sharing"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":9,"issueCount":0,"starsCount":21,"forksCount":1,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-27T15:16:04.250Z"}},{"type":"Public","name":"feature-factory","owner":"databrickslabs","isFork":false,"description":"Accelerator to rapidly deploy customized features for your business","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":1,"starsCount":55,"forksCount":25,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-10T20:34:04.112Z"}},{"type":"Public","name":"delta-oms","owner":"databrickslabs","isFork":false,"description":"DeltaOMS is a solution that help build a centralized repository of Delta Transaction logs and associated operational metrics/statistics for your Delta Lakehouse. Unity Catalog supported in the v0.7.0-rc1 release.Documentation here - https://databrickslabs.github.io/delta-oms/v0.7.0-rc1/","allTopics":["monitoring","metrics","delta","centralized","databricks","delta-lake","lakehouse"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":1,"issueCount":6,"starsCount":36,"forksCount":3,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-27T22:06:31.489Z"}},{"type":"Public","name":"partner-connect-api","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":11,"issueCount":1,"starsCount":12,"forksCount":3,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-27T22:05:07.253Z"}},{"type":"Public","name":"migrate","owner":"databrickslabs","isFork":false,"description":"Old scripts for one-off ST-to-E2 migrations. Use \"terraform exporter\" linked in the readme.","allTopics":["databricks-migration"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":42,"starsCount":175,"forksCount":123,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-27T22:01:42.597Z"}},{"type":"Public","name":"dolly","owner":"databrickslabs","isFork":false,"description":"Databricks’ Dolly, a large language model trained on the Databricks Machine Learning Platform","allTopics":["chatbot","gpt","databricks","dolly"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":10794,"forksCount":1158,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-30T18:36:16.616Z"}},{"type":"Public","name":"geoscan","owner":"databrickslabs","isFork":false,"description":"Geospatial clustering at massive scale","allTopics":["library","spark-ml","clustering"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":5,"issueCount":2,"starsCount":91,"forksCount":19,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-05-22T01:58:31.628Z"}}],"repositoryCount":34,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}