{"payload":{"pageCount":2,"repositories":[{"type":"Public","name":"vllm-fork","owner":"HabanaAI","isFork":true,"description":"A high-throughput and memory-efficient inference and serving engine for LLMs","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":34,"issueCount":23,"starsCount":34,"forksCount":3977,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-21T00:23:34.087Z"}},{"type":"Public","name":"Gaudi-tutorials","owner":"HabanaAI","isFork":false,"description":"Tutorials for running models on First-gen Gaudi and Gaudi2 for Training and Inference. The source files for the tutorials on <a href=\"https://developer.habana.ai/\" rel=\"nofollow\">https://developer.habana.ai/</a>","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":3,"starsCount":47,"forksCount":31,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-20T20:56:05.187Z"}},{"type":"Public","name":"optimum-habana-fork","owner":"HabanaAI","isFork":true,"description":"Easy and lightning fast training of 🤗 Transformers on Habana Gaudi processor (HPU)","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":3,"forksCount":183,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-20T18:10:24.852Z"}},{"type":"Public","name":"vllm-hpu-extension","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":0,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,7],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-20T13:44:42.879Z"}},{"type":"Public","name":"Model-References","owner":"HabanaAI","isFork":false,"description":"Reference models for Intel(R) Gaudi(R) AI Accelerator","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":8,"issueCount":12,"starsCount":152,"forksCount":76,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-16T21:57:52.136Z"}},{"type":"Public","name":"neural-compressor","owner":"HabanaAI","isFork":true,"description":"SOTA low-bit LLM quantization (INT8/FP8/INT4/FP4/NF4) &amp; sparsity; leading model compression techniques on TensorFlow, PyTorch, and ONNX Runtime","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":252,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-16T08:34:32.522Z"}},{"type":"Public","name":"Habana_Custom_Kernel","owner":"HabanaAI","isFork":false,"description":"Provides the examples to write and build Habana custom kernels using the HabanaTools","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":1,"issueCount":3,"starsCount":16,"forksCount":17,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-13T23:07:28.113Z"}},{"type":"Public","name":"hccl_ofi_wrapper","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"BSD 3-Clause \"New\" or \"Revised\" License","participation":[0,0,0,0,0,1,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,2,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-12T10:31:54.010Z"}},{"type":"Public","name":"hccl_demo","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":2,"issueCount":0,"starsCount":11,"forksCount":9,"license":"Apache License 2.0","participation":[0,0,0,0,0,4,2,0,0,0,0,2,2,2,0,0,2,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,1,2,0,0,0,0,0,0,0,0,1,1,0,0,1,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-03T14:42:29.594Z"}},{"type":"Public","name":"Megatron-LM","owner":"HabanaAI","isFork":true,"description":"Ongoing research training transformer models at scale","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":2260,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-09-02T16:54:06.114Z"}},{"type":"Public","name":"Megatron-DeepSpeed","owner":"HabanaAI","isFork":true,"description":"Intel Gaudi's Megatron DeepSpeed Large Language Models for training","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":12,"forksCount":2260,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-25T17:55:26.663Z"}},{"type":"Public","name":"DeepSpeed","owner":"HabanaAI","isFork":true,"description":"DeepSpeed is a deep learning optimization library that makes distributed training and inference easy, efficient, and effective.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":11,"forksCount":4052,"license":"Apache License 2.0","participation":[9,23,15,14,11,11,30,17,2,10,10,14,16,1,15,24,20,19,22,23,23,15,9,10,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-25T11:54:24.128Z"}},{"type":"Public","name":"Setup_and_Install","owner":"HabanaAI","isFork":false,"description":"Setup and Installation Instructions for Habana binaries, docker image creation","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":4,"issueCount":5,"starsCount":23,"forksCount":12,"license":"Apache License 2.0","participation":[0,1,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,1,0,0,0,0,0,2,0,0,0,2,0,0,0,0,0,0,0,0,2,0,1,1,0,0,0,0,0,2,0,2,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-23T19:02:55.805Z"}},{"type":"Public","name":"Fairseq","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":2,"forksCount":1,"license":"MIT License","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-11T15:00:15.149Z"}},{"type":"Public","name":"HCL","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":1,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-08-07T05:58:36.472Z"}},{"type":"Public","name":"AutoGPTQ","owner":"HabanaAI","isFork":true,"description":"An easy-to-use LLMs quantization package with user-friendly apis, based on GPTQ algorithm.","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":2,"issueCount":0,"starsCount":0,"forksCount":463,"license":"MIT License","participation":[15,0,0,1,5,11,6,3,2,0,3,7,0,0,0,0,1,4,1,0,20,4,4,0,0,7,10,1,2,2,0,6,0,0,0,0,0,1,2,3,5,3,1,0,1,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-31T09:01:14.808Z"}},{"type":"Public","name":"drivers.gpu.linux-nic.kernel","owner":"HabanaAI","isFork":false,"description":"NIC drivers (Ethernet, IBverbs and common) for the NIC IP that is inside Intel's data-center GPU","allTopics":[],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":2,"license":"Other","participation":[1651,1849,1750,1837,1621,1183,1135,1291,1548,1892,2021,2007,1805,661,955,1238,1159,1883,2005,1754,2037,2090,1733,1716,1207,1306,1728,1720,1794,1471,1675,1349,939,484,389,284,163,13,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-25T06:23:23.654Z"}},{"type":"Public","name":"drivers.accel.habanalabs.kernel","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":0,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-24T14:39:13.916Z"}},{"type":"Public","name":"rdma-core","owner":"HabanaAI","isFork":true,"description":"RDMA core userspace libraries and daemons","allTopics":[],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":676,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-24T07:09:27.105Z"}},{"type":"Public","name":"papers","owner":"HabanaAI","isFork":false,"description":"Academic papers by Habana research team","allTopics":[],"primaryLanguage":null,"pullRequestCount":0,"issueCount":0,"starsCount":1,"forksCount":2,"license":null,"participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-20T14:10:16.851Z"}},{"type":"Public","name":"habanalabs-k8s-device-plugin","owner":"HabanaAI","isFork":false,"description":"HABANA device plugin for Kubernetes","allTopics":["kubernetes","cloud"],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":1,"issueCount":0,"starsCount":4,"forksCount":3,"license":"Apache License 2.0","participation":[0,0,0,0,0,0,2,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,2,0,2,0,1,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-17T15:12:07.752Z"}},{"type":"Public","name":"Gaudi2-Workshop","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":8,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-17T07:06:54.305Z"}},{"type":"Public","name":"DeepSpeedExamples","owner":"HabanaAI","isFork":true,"description":"Example models using DeepSpeed","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":0,"issueCount":0,"starsCount":0,"forksCount":1019,"license":null,"participation":[0,11,4,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,1,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-07-02T06:53:00.890Z"}},{"type":"Public","name":"hl-thunk-open","owner":"HabanaAI","isFork":false,"description":"Thunk library for HabanaLabs kernel driver","allTopics":[],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":8,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-16T06:45:40.125Z"}},{"type":"Public","name":"Intel_Gaudi3_Software","owner":"HabanaAI","isFork":false,"description":"Intel® Gaudi® Software is an implementation of the runtime and graph compiler for Gaudi3","allTopics":[],"primaryLanguage":{"name":"C++","color":"#f34b7d"},"pullRequestCount":0,"issueCount":0,"starsCount":4,"forksCount":3,"license":"Other","participation":[0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,0,4,6,0,0,0,0,0,0,0,0,0,0,0,0,0,0],"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-10T05:19:00.811Z"}},{"type":"Public","name":"habana-container-runtime","owner":"HabanaAI","isFork":false,"description":"Habana container runtime","allTopics":["docker","runtime","container"],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":2,"issueCount":0,"starsCount":5,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-06T10:22:11.215Z"}},{"type":"Public","name":"gohlml","owner":"HabanaAI","isFork":false,"description":"HABANA Management Library bindings for Go","allTopics":[],"primaryLanguage":{"name":"Go","color":"#00ADD8"},"pullRequestCount":0,"issueCount":0,"starsCount":3,"forksCount":2,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-06-06T10:12:50.098Z"}},{"type":"Public","name":"slurm","owner":"HabanaAI","isFork":true,"description":"Slurm: A Highly Scalable Workload Manager","allTopics":[],"primaryLanguage":{"name":"C","color":"#555555"},"pullRequestCount":1,"issueCount":0,"starsCount":2,"forksCount":655,"license":"Other","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-05-20T16:07:55.034Z"}},{"type":"Public","name":"Gaudi-solutions","owner":"HabanaAI","isFork":false,"description":"Full End-to-End examples showing how to use First-gen Gaudi and Gaudi2 in common use cases","allTopics":[],"primaryLanguage":{"name":"Jupyter Notebook","color":"#DA5B0B"},"pullRequestCount":0,"issueCount":0,"starsCount":9,"forksCount":4,"license":"Apache License 2.0","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2024-04-19T22:25:03.635Z"}},{"type":"Public","name":"deepspeed_old","owner":"HabanaAI","isFork":false,"description":"","allTopics":[],"primaryLanguage":{"name":"Python","color":"#3572A5"},"pullRequestCount":1,"issueCount":0,"starsCount":6,"forksCount":3,"license":"MIT License","participation":null,"lastUpdated":{"hasBeenPushedTo":true,"timestamp":"2023-07-03T20:00:24.859Z"}}],"repositoryCount":36,"userInfo":null,"searchable":true,"definitions":[],"typeFilters":[{"id":"all","text":"All"},{"id":"public","text":"Public"},{"id":"source","text":"Sources"},{"id":"fork","text":"Forks"},{"id":"archived","text":"Archived"},{"id":"template","text":"Templates"}],"compactMode":false},"title":"HabanaAI repositories"}