{"payload":{"header_redesign_enabled":false,"results":[{"id":"744514418","archived":false,"color":"#3572A5","followers":489,"has_funding_file":false,"hl_name":"IST-DASLab/marlin","hl_trunc_description":"FP16xINT4 LLM inference kernel that can achieve near-ideal ~4x speedups up to medium batchsizes of 16-32 tokens.","language":"Python","mirror":false,"owned_by_organization":true,"public":true,"repo":{"repository":{"id":744514418,"name":"marlin","owner_id":35098403,"owner_login":"IST-DASLab","updated_at":"2024-07-10T03:28:13.078Z","has_issues":true}},"sponsorable":false,"topics":["kernel","quantization","4bit","llm"],"type":"Public","help_wanted_issues_count":0,"good_first_issue_issues_count":0,"starred_by_current_user":false}],"type":"repositories","page":1,"page_count":1,"elapsed_millis":54,"errors":[],"result_count":1,"facets":[],"protected_org_logins":[],"topics":null,"query_id":"","logged_in":false,"sign_up_path":"/signup?source=code_search_results","sign_in_path":"/login?return_to=https%3A%2F%2Fgithub.com%2Fsearch%3Fq%3Drepo%253AIST-DASLab%252Fmarlin%2B%2Blanguage%253APython","metadata":null,"csrf_tokens":{"/IST-DASLab/marlin/star":{"post":"AlhSNVPz5PsyuSW0ewDAFqK_tODHtYHsHzyyFv3S_w1CU0jttawLpvHaiW6_i1qnHfkYK0ap__33NcnUIxyNZA"},"/IST-DASLab/marlin/unstar":{"post":"g2nysvF3aJNmUmkiFxvCNznfAxfuP-tUggfTAzaW5edSO4h5_WL6qA8u1llMyBzhHTmQdCOClOnycZCukjJRhQ"},"/sponsors/batch_deferred_sponsor_buttons":{"post":"gLGiwdxQGjJiYdnlE45XAugx8LVsUQZc8F2kMOwL6LHFb7oJ7OcOCMtxlwePJcJilJLWcqcXfN2X0GsvoIzSZA"}}},"title":"Repository search results"}