{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"tempo","owner":"databrickslabs","isFork":false,"description":"API for manipulating time series on top of Apache Spark: lagged time values, rolling statistics (mean, avg, sum, count, etc), AS OF joins, downsampling, and interpolation","allTopics":["python","scala","timeseries-data","timeseries-analysis","data-science","timeseries","time-series","pandas","data-analysis"],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":11,"issueCount":33,"starsCount":297,"forksCount":50,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-02T01:29:33.171Z"}},{"type":"Public","name":"dbldatagen","owner":"databrickslabs","isFork":false,"description":"Generate relevant synthetic data quickly for your projects. The Databricks Labs synthetic data generator (aka `dbldatagen`) may be used to generate large simulated / synthetic data sets for test, POCs, and other uses in Databricks environments including in Delta Live Tables pipelines","allTopics":["spark","faker","pyspark","spark-streaming","data-generation","databricks","synthetic-data","datagen","datagenerator","deltalake","datageneration","delta-live-tables","python"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":13,"issueCount":13,"starsCount":272,"forksCount":53,"license":"Other","participation":[0,1,0,1,1,2,0,0,0,0,0,0,0,0,0,0,0,2,0,0,0,0,0,0,1,0,0,0,1,0,0,0,0,0,0,0,0,1,1,0,0,0,1,0,0,0,0,0,0,0,3,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T22:01:59.785Z"}},{"type":"Public","name":"ucx","owner":"databrickslabs","isFork":false,"description":"Your best companion for upgrading to Unity Catalog. UCX will guide you, the Databricks customer, through the process of upgrading your account, groups, workspaces, jobs etc. to Unity Catalog.","allTopics":["databricks","unity-catalog","databricks-cli-installable"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":6,"issueCount":117,"starsCount":171,"forksCount":64,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-01T09:34:26.411Z"}},{"type":"Public","name":"overwatch","owner":"databrickslabs","isFork":false,"description":"Capture deep metrics on one or all assets within a Databricks workspace","allTopics":["monitoring","databricks"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":15,"issueCount":140,"starsCount":219,"forksCount":59,"license":"Other","participation":[2,2,6,0,0,0,0,0,5,1,0,0,0,0,1,0,0,1,0,0,0,1,0,2,4,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,1,0,0,0,0,0,0,1,0,1,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T20:14:08.425Z"}},{"type":"Public","name":"remorph","owner":"databrickslabs","isFork":false,"description":"Cross-compiler and Data Reconciler into Databricks Lakehouse","allTopics":["reconciliation","data-validation","transpiler","databricks"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":14,"issueCount":106,"starsCount":15,"forksCount":10,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,1,1,0,0,0,0,1,0,0,0,4,10,8,8,6,4,7,9,5,7,5,7,10,11,12,20,10,19,9,22,17],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T20:03:40.339Z"}},{"type":"Public","name":"lsql","owner":"databrickslabs","isFork":false,"description":"Lightweight SQL execution wrapper only on top of Databricks SDK","allTopics":["databricks","databricks-sql","databricks-sdk"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":19,"starsCount":3,"forksCount":1,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-31T10:30:03.278Z"}},{"type":"Public","name":"blueprint","owner":"databrickslabs","isFork":false,"description":"Baseline for Databricks Labs projects written in Python ","allTopics":["python","cli","databricks","databricks-cli-installable"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":3,"starsCount":11,"forksCount":6,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,3,12,11,0,2,3,11,0,2,4,5,7,9,1,4,5,0,0,2,0,3,3,5,2],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-30T20:21:53.064Z"}},{"type":"Public","name":"mosaic","owner":"databrickslabs","isFork":false,"description":"An extension to the Apache Spark framework that allows easy and fast processing of very large geospatial datasets.","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":9,"issueCount":57,"starsCount":254,"forksCount":61,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-28T20:46:44.644Z"}},{"type":"Public","name":"sandbox","owner":"databrickslabs","isFork":false,"description":"Experimental or low-maturity things","allTopics":["databricks","databricks-api","databricks-sdk"],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":16,"issueCount":6,"starsCount":16,"forksCount":4,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-28T16:01:17.410Z"}},{"type":"Public","name":"dbignite","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":1,"starsCount":22,"forksCount":10,"license":"Other","participation":[4,4,35,9,8,38,3,6,5,0,0,0,0,1,0,11,0,0,9,1,0,1,6,0,0,1,0,30,0,5,10,18,0,0,0,0,0,0,1,0,0,0,0,1,0,0,0,5,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T08:19:35.243Z"}},{"type":"Public","name":"dlt-meta","owner":"databrickslabs","isFork":false,"description":"This is metadata driven DLT based framework for bronze/silver pipelines","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":15,"starsCount":123,"forksCount":53,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-09T23:29:32.612Z"}},{"type":"Public","name":"dataframe-rules-engine","owner":"databrickslabs","isFork":false,"description":"Extensible Rules Engine for custom Dataframe / Dataset validation","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":4,"issueCount":8,"starsCount":133,"forksCount":30,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-07T21:04:37.881Z"}},{"type":"Public","name":"splunk-integration","owner":"databrickslabs","isFork":false,"description":"Databricks Add-on for Splunk","allTopics":["cybersecurity","databricks","databricks-notebooks","splunk-addon"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":3,"issueCount":15,"starsCount":26,"forksCount":17,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-07T10:27:01.996Z"}},{"type":"Public","name":"pylint-plugin","owner":"databrickslabs","isFork":false,"description":"Databricks Plugin for PyLint","allTopics":["python","databricks","pylint-plugin"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":11,"starsCount":7,"forksCount":2,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-26T12:01:18.287Z"}},{"type":"Public","name":"databricks-sdk-r","owner":"databrickslabs","isFork":false,"description":"Databricks SDK for R (Experimental)","allTopics":["data-science","r","sdk","databricks"],"primaryLanguage":{"name":"R","color":"#198CE7"},"pullRequestCount":1,"issueCount":6,"starsCount":20,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-08T10:28:16.311Z"}},{"type":"Public","name":"tika-ocr","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Rich Text Format","color":"#ccc"},"pullRequestCount":4,"issueCount":2,"starsCount":17,"forksCount":2,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-03T20:25:20.972Z"}},{"type":"Public","name":"discoverx","owner":"databrickslabs","isFork":false,"description":"A Swiss-Army-knife for your Data Intelligence platform administration.","allTopics":["scanning","data-retrieval","pii-detection","semantic-classification","multi-table-operations"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":10,"issueCount":7,"starsCount":98,"forksCount":9,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-27T11:23:04.648Z"}},{"type":"Public","name":"delta-sharing-java-connector","owner":"databrickslabs","isFork":false,"description":"A Java connector for delta.io/sharing/ that allows you to easily ingest data on any JVM.","allTopics":["java","delta-sharing"],"primaryLanguage":{"name":"Java","color":"#b07219"},"pullRequestCount":2,"issueCount":2,"starsCount":12,"forksCount":5,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-25T18:59:46.547Z"}},{"type":"Public","name":"transpiler","owner":"databrickslabs","isFork":false,"description":"SIEM-to-Spark Transpiler","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":5,"issueCount":13,"starsCount":39,"forksCount":5,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-18T20:31:06.843Z"}},{"type":"Public","name":"smolder","owner":"databrickslabs","isFork":false,"description":"HL7 Apache Spark Datasource","allTopics":["spark","hl7","datasource","hl7v2"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":0,"issueCount":1,"starsCount":57,"forksCount":20,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-03-15T17:53:23.893Z"}},{"type":"Public","name":"dbx","owner":"databrickslabs","isFork":false,"description":"🧱 Databricks CLI eXtensions - aka dbx is a CLI tool for development and advanced Databricks workflows management.","allTopics":["ci","cicd","databricks","mlops","databricks-cli","databricks-api"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":12,"issueCount":91,"starsCount":435,"forksCount":119,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-26T13:26:25.713Z"}},{"type":"Public","name":"doc-qa","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":0,"starsCount":41,"forksCount":5,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-02-23T06:55:32.059Z"}},{"type":"Public","name":"databricks-sync","owner":"databrickslabs","isFork":false,"description":"An experimental tool to synchronize source Databricks deployment with a target Databricks deployment.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":16,"starsCount":46,"forksCount":12,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-01-21T19:34:04.619Z"}},{"type":"Public","name":"arcuate","owner":"databrickslabs","isFork":false,"description":"Delta Sharing + MLflow for ML model & experiment exchange (arcuate delta - a fan shaped river delta)","allTopics":["big-data","spark","data-sharing","mlflow","delta-sharing"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":9,"issueCount":0,"starsCount":21,"forksCount":1,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-27T15:16:04.250Z"}},{"type":"Public","name":"feature-factory","owner":"databrickslabs","isFork":false,"description":"Accelerator to rapidly deploy customized features for your business","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":1,"starsCount":54,"forksCount":25,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-12-10T20:34:04.112Z"}},{"type":"Public","name":"delta-oms","owner":"databrickslabs","isFork":false,"description":"DeltaOMS is a solution that help build a centralized repository of Delta Transaction logs and associated operational metrics/statistics for your Delta Lakehouse. Unity Catalog supported in the v0.7.0-rc1 release.Documentation here - https://databrickslabs.github.io/delta-oms/v0.7.0-rc1/","allTopics":["monitoring","metrics","delta","centralized","databricks","delta-lake","lakehouse"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":1,"issueCount":6,"starsCount":36,"forksCount":3,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-27T22:06:31.489Z"}},{"type":"Public","name":"partner-connect-api","owner":"databrickslabs","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":11,"issueCount":1,"starsCount":12,"forksCount":3,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-27T22:05:07.253Z"}},{"type":"Public","name":"migrate","owner":"databrickslabs","isFork":false,"description":"Old scripts for one-off ST-to-E2 migrations. Use \"terraform exporter\" linked in the readme.","allTopics":["databricks-migration"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":7,"issueCount":42,"starsCount":174,"forksCount":123,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-11-27T22:01:42.597Z"}},{"type":"Public","name":"dolly","owner":"databrickslabs","isFork":false,"description":"Databricks’ Dolly, a large language model trained on the Databricks Machine Learning Platform","allTopics":["chatbot","gpt","databricks","dolly"],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":5,"starsCount":10793,"forksCount":1160,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-06-30T18:36:16.616Z"}},{"type":"Public","name":"geoscan","owner":"databrickslabs","isFork":false,"description":"Geospatial clustering at massive scale","allTopics":["library","spark-ml","clustering"],"primaryLanguage":{"name":"Scala","color":"#c22d40"},"pullRequestCount":5,"issueCount":2,"starsCount":91,"forksCount":19,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-05-22T01:58:31.628Z"}}],"repositoryCount":34,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"Repositories"}