{"users":[{"id":2,"username":"Coby","avatar_template":"/user_avatar/community.sambanova.ai/coby/{size}/17_2.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"admin":true,"moderator":true,"trust_level":4},{"id":161,"username":"shivani.moze","avatar_template":"/user_avatar/community.sambanova.ai/shivani.moze/{size}/2802_2.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"admin":true,"moderator":true,"trust_level":3},{"id":156,"username":"saurabh.patil","avatar_template":"/user_avatar/community.sambanova.ai/saurabh.patil/{size}/1908_2.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"moderator":true,"trust_level":3},{"id":47,"username":"prafull.thokal","avatar_template":"/user_avatar/community.sambanova.ai/prafull.thokal/{size}/20_2.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"moderator":true,"trust_level":3},{"id":157,"username":"Rohit.Vyawahare","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/r/8dc957/{size}.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"trust_level":3},{"id":48,"username":"durgesh.ojha","avatar_template":"/user_avatar/community.sambanova.ai/durgesh.ojha/{size}/413_2.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"admin":true,"moderator":true,"trust_level":3},{"id":159,"username":"prajwal.balapure","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/p/a9a28c/{size}.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"moderator":true,"trust_level":3},{"id":158,"username":"omkar.gangan","avatar_template":"/user_avatar/community.sambanova.ai/omkar.gangan/{size}/217_2.png","flair_name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_group_id":45,"admin":true,"moderator":true,"trust_level":3},{"id":189,"username":"ankit.agrawal","avatar_template":"https://avatars.discourse-cdn.com/v4/letter/a/bc79bd/{size}.png","moderator":true,"trust_level":3}],"primary_groups":[],"flair_groups":[{"id":45,"name":"SambaNova-Employee","flair_url":"https://us1.discourse-cdn.com/sambanova/original/2X/d/dcb40fb85fe3a51eb4d4fc429f5c5eed363140a3.png","flair_bg_color":"","flair_color":""}],"topic_list":{"can_create_topic":false,"more_topics_url":"/c/ka/83?page=1","per_page":30,"top_tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"},{"id":38,"name":"cloud","slug":"cloud"},{"id":48,"name":"sambanova-suite","slug":"sambanova-suite"},{"id":18,"name":"doc","slug":"doc"},{"id":49,"name":"on-prem","slug":"on-prem"},{"id":51,"name":"ai","slug":"ai"},{"id":30,"name":"billing","slug":"billing"},{"id":47,"name":"contact","slug":"contact"},{"id":44,"name":"debugging","slug":"debugging"},{"id":55,"name":"dify","slug":"dify"},{"id":8,"name":"function_calling","slug":"function-calling"},{"id":27,"name":"inference","slug":"inference"},{"id":13,"name":"support","slug":"support"},{"id":50,"name":"text-generation","slug":"text-generation"},{"id":28,"name":"troubleshooting","slug":"troubleshooting"},{"id":31,"name":"ui","slug":"ui"}],"topics":[{"fancy_title":"About the Knowledge Articles category","id":873,"title":"About the Knowledge Articles category","slug":"about-the-knowledge-articles-category","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-02-04T02:58:09.062Z","last_posted_at":"2025-02-04T02:58:09.067Z","bumped":true,"bumped_at":"2025-05-30T13:54:05.962Z","archetype":"regular","unseen":false,"pinned":true,"unpinned":null,"excerpt":"This section will contain general Knowledge Articles created primarily form the SambaNova Support team.  It will contain articles for both Cloud based and on premises products.","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":23,"like_count":0,"has_summary":false,"last_poster_username":"Coby","category_id":83,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":2,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Agentic RAG: Think–Act–Retrieve–Answer","id":1316,"title":"Agentic RAG: Think–Act–Retrieve–Answer","slug":"agentic-rag-think-act-retrieve-answer","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":"https://us1.discourse-cdn.com/sambanova/original/2X/a/a7415f4a88a02015cfdecc206a3c953f565625a7.jpeg","created_at":"2025-08-19T03:19:36.384Z","last_posted_at":"2025-08-19T03:34:07.182Z","bumped":true,"bumped_at":"2025-08-19T03:34:07.182Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Introduction\nLarge Language Models (LLMs) are powerful, but they face inherent limitations such as outdated knowledge, hallucinations, and an inability to access private or real-time data. Retrieval-Augmented Generation &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"}],"tags_descriptions":{},"views":108,"like_count":9,"has_summary":false,"last_poster_username":"Coby","category_id":83,"op_like_count":5,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":161,"primary_group_id":null,"flair_group_id":45},{"extras":"latest","description":"Most Recent Poster","user_id":2,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Why do I see a monetary value for &ldquo;Usage&rdquo; data that exists before the Development Tier launch?","id":902,"title":"Why do I see a monetary value for \"Usage\" data that exists before the Development Tier launch?","slug":"why-do-i-see-a-monetary-value-for-usage-data-that-exists-before-the-development-tier-launch","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://us1.discourse-cdn.com/sambanova/optimized/2X/a/a0e38c2674336b142809a7654079949a29bdbf99_2_1024x309.png","created_at":"2025-02-08T21:33:50.840Z","last_posted_at":"2025-02-08T21:33:50.931Z","bumped":true,"bumped_at":"2025-07-30T07:33:03.882Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"While Navigating the SambaCloud user interface you may notice that in your Usage section that you will see Usage data reflecting an associated dollar value from before the February 8th 2025 date . \n  \nWe did this in orde&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"},{"id":31,"name":"ui","slug":"ui"},{"id":30,"name":"billing","slug":"billing"}],"tags_descriptions":{},"views":90,"like_count":3,"has_summary":false,"last_poster_username":"Coby","category_id":83,"op_like_count":3,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":2,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"SambaCloud Integration with Dify:","id":1276,"title":"SambaCloud Integration with Dify:","slug":"sambacloud-integration-with-dify","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-07-23T06:32:54.262Z","last_posted_at":"2025-07-23T06:32:54.396Z","bumped":true,"bumped_at":"2025-07-30T07:30:39.020Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":":pushpin: Overview\nThis document explains how to integrate SambaCloud LLMs into the Dify AI application platform. Dify enables fast development of LLM apps with a no-code/low-code approach. \n:puzzle_piece: What is Dify?\nD&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":38,"name":"cloud","slug":"cloud"},{"id":55,"name":"dify","slug":"dify"}],"tags_descriptions":{},"views":44,"like_count":2,"has_summary":false,"last_poster_username":"saurabh.patil","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":156,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"🛠️ Standardized API Calling Templates for SambaCloud Models","id":1278,"title":"🛠️ Standardized API Calling Templates for SambaCloud Models","slug":"standardized-api-calling-templates-for-sambacloud-models","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-07-24T09:44:45.730Z","last_posted_at":"2025-07-24T09:44:45.880Z","bumped":true,"bumped_at":"2025-07-30T07:23:40.216Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"This document outlines standardized calling templates for all model offerings in SambaCloud, categorized by modality and capability. It includes key differences between each API usage pattern to ensure clarity and consis&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":43,"like_count":3,"has_summary":false,"last_poster_username":"prafull.thokal","category_id":83,"op_like_count":3,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":47,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"SambaCloud Dashboard Overview","id":1287,"title":"SambaCloud Dashboard Overview","slug":"sambacloud-dashboard-overview","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://us1.discourse-cdn.com/sambanova/optimized/2X/9/9b77825954d840dba14184be015cdb65d76e2e34_2_1024x547.jpeg","created_at":"2025-07-30T05:18:24.563Z","last_posted_at":"2025-07-30T05:18:24.696Z","bumped":true,"bumped_at":"2025-07-30T07:20:50.563Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Purpose:\nThis page provides a high-level overview of the SambaCloud Dashboard. \nDashboard Overview:\nThe SambaCloud Dashboard is a user-friendly interface that provides access to various tools and features for working wit&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"}],"tags_descriptions":{},"views":32,"like_count":1,"has_summary":false,"last_poster_username":"Rohit.Vyawahare","category_id":83,"op_like_count":1,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":157,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Model Context Protocol (MCP) Servers","id":1285,"title":"Model Context Protocol (MCP) Servers","slug":"model-context-protocol-mcp-servers","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-07-29T13:22:27.688Z","last_posted_at":"2025-07-29T13:22:27.811Z","bumped":true,"bumped_at":"2025-07-29T13:22:27.811Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Overview\nModel Context Protocol (MCP) servers are components in a machine learning infrastructure that manage the contextual information needed to execute models efficiently. MCP servers maintain session states, model we&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":18,"name":"doc","slug":"doc"}],"tags_descriptions":{},"views":47,"like_count":2,"has_summary":false,"last_poster_username":"durgesh.ojha","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":48,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"A Step-by-Step Guide to AI Inference Using Oumi and SambaNova","id":1284,"title":"A Step-by-Step Guide to AI Inference Using Oumi and SambaNova","slug":"a-step-by-step-guide-to-ai-inference-using-oumi-and-sambanova","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-07-29T11:51:31.676Z","last_posted_at":"2025-07-29T11:51:31.794Z","bumped":true,"bumped_at":"2025-07-29T11:51:31.794Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What is Oumi? \nOumi is an open-source AI development platform for training, fine-tuning, deploying, evaluating, and serving large language models (LLMs). \nIt supports models like LLaMA, Mistral, OpenHermes, TinyLlama, an&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"}],"tags_descriptions":{},"views":49,"like_count":3,"has_summary":false,"last_poster_username":"shivani.moze","category_id":83,"op_like_count":3,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":161,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Core Concepts Behind Large Language Models (LLMs)","id":1283,"title":"Core Concepts Behind Large Language Models (LLMs)","slug":"core-concepts-behind-large-language-models-llms","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-07-29T07:19:12.345Z","last_posted_at":"2025-07-29T07:19:12.530Z","bumped":true,"bumped_at":"2025-07-29T07:19:12.530Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What is a Large Language Model?\nA Large Language Model (LLM) is a type of artificial intelligence trained to understand and generate human language. LLMs like Meta-Llama-3.3-70B-Instruct and \nLlama-4-Maverick-17B-128E-In&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"}],"tags_descriptions":{},"views":36,"like_count":2,"has_summary":false,"last_poster_username":"shivani.moze","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":161,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Shape the Future of AI—Join the SambaNova Community Movement!","id":1238,"title":"Shape the Future of AI—Join the SambaNova Community Movement!","slug":"shape-the-future-of-ai-join-the-sambanova-community-movement","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://us1.discourse-cdn.com/sambanova/optimized/2X/6/68e40261f0b031920d3e52a1143a9e01e1cd1b2f_2_1024x150.png","created_at":"2025-06-27T10:37:12.962Z","last_posted_at":"2025-06-27T10:37:13.099Z","bumped":true,"bumped_at":"2025-06-27T10:37:13.099Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Introduction: \nWelcome to the vibrant world of SambaNova! \nHere, we don’t just use AI—we shape it. Our community thrives on shared knowledge, collaboration, and bold innovation. \nThis space is designed to empower YOU—whe&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":32,"like_count":1,"has_summary":false,"last_poster_username":"durgesh.ojha","category_id":83,"op_like_count":1,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":48,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"An Introduction to Cline: Your AI-Powered Development Assistant in VS Code","id":1237,"title":"An Introduction to Cline: Your AI-Powered Development Assistant in VS Code","slug":"an-introduction-to-cline-your-ai-powered-development-assistant-in-vs-code","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-06-27T10:27:39.894Z","last_posted_at":"2025-06-27T10:27:40.015Z","bumped":true,"bumped_at":"2025-06-27T10:27:40.015Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What is Cline?\nCline is an intelligent, AI-powered development assistant seamlessly integrated into Visual Studio Code (VS Code). Designed to enhance productivity, reduce context-switching, and supercharge your coding wo&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":131,"like_count":2,"has_summary":false,"last_poster_username":"durgesh.ojha","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":48,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Unlocking AI Innovation: Leveraging SambaNova APIs","id":1236,"title":"Unlocking AI Innovation: Leveraging SambaNova APIs","slug":"unlocking-ai-innovation-leveraging-sambanova-apis","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-06-27T10:25:15.841Z","last_posted_at":"2025-06-27T10:25:15.965Z","bumped":true,"bumped_at":"2025-06-27T10:25:15.965Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Introduction\nThe rapid evolution of Artificial Intelligence (AI) has transformed the way businesses operate, innovate, and deliver value to their customers. As AI continues to advance, organizations are seeking ways to h&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":39,"like_count":2,"has_summary":false,"last_poster_username":"durgesh.ojha","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":48,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Knowledge Distillation in Large Language Models","id":1233,"title":"Knowledge Distillation in Large Language Models","slug":"knowledge-distillation-in-large-language-models","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-06-25T02:21:49.502Z","last_posted_at":"2025-06-25T02:21:49.669Z","bumped":true,"bumped_at":"2025-06-25T02:21:49.669Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Introduction\nLLM Distillation is a specialized form of Knowledge Distillation (KD) aimed at compressing large-scale language models while preserving their performance. It enables smaller, more efficient models to approxi&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"},{"id":51,"name":"ai","slug":"ai"}],"tags_descriptions":{},"views":87,"like_count":2,"has_summary":false,"last_poster_username":"prajwal.balapure","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":159,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"A Deep Dive into Reasoning Models","id":1208,"title":"A Deep Dive into Reasoning Models","slug":"a-deep-dive-into-reasoning-models","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-06-20T06:09:30.780Z","last_posted_at":"2025-06-20T13:58:16.364Z","bumped":true,"bumped_at":"2025-06-20T13:58:16.364Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Introduction: What Are Reasoning Models?\nA reasoning model is a type of large language model (LLM) that can perform complex reasoning tasks. Instead of quickly generating output based solely on a statistical guess of wha&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"}],"tags_descriptions":{},"views":91,"like_count":4,"has_summary":false,"last_poster_username":"omkar.gangan","category_id":83,"op_like_count":3,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":159,"primary_group_id":null,"flair_group_id":45},{"extras":"latest","description":"Most Recent Poster","user_id":158,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"What Is Multimodal RAG? Simple Guide Using Sambanova APIs and models","id":1207,"title":"What Is Multimodal RAG? Simple Guide Using Sambanova APIs and models","slug":"what-is-multimodal-rag-simple-guide-using-sambanova-apis-and-models","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-06-20T06:01:46.269Z","last_posted_at":"2025-06-20T13:48:46.700Z","bumped":true,"bumped_at":"2025-06-20T13:48:46.700Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What Is Multimodal RAG?\nMultimodal RAG = Retrieval-Augmented Generation that works with more than just text, like images, PDFs, audio, or videos.\nThink of it like this: \nA smart assistant that can search through not just&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"},{"id":18,"name":"doc","slug":"doc"}],"tags_descriptions":{},"views":95,"like_count":3,"has_summary":false,"last_poster_username":"omkar.gangan","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":161,"primary_group_id":null,"flair_group_id":45},{"extras":"latest","description":"Most Recent Poster","user_id":158,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"How to activate the endpoint for COE bundles","id":1205,"title":"How to activate the endpoint for COE bundles","slug":"how-to-activate-the-endpoint-for-coe-bundles","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://us1.discourse-cdn.com/sambanova/optimized/2X/6/6a806eb0fa701e5d6a0b038bf06914ed025fcd30_2_1024x424.png","created_at":"2025-06-19T03:50:31.341Z","last_posted_at":"2025-06-19T03:50:31.459Z","bumped":true,"bumped_at":"2025-06-19T03:53:27.749Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Purpose:\nThe purpose of this page is to provide a step-by-step guide on creating COE bundles in Studio. COE bundles are pre-configured templates that enable organizations to standardize and accelerate their development p&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"},{"id":48,"name":"sambanova-suite","slug":"sambanova-suite"}],"tags_descriptions":{},"views":40,"like_count":3,"has_summary":false,"last_poster_username":"Rohit.Vyawahare","category_id":83,"op_like_count":3,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":157,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Function Calling &amp; JSON Mode in SambaNova Cloud","id":1196,"title":"Function Calling & JSON Mode in SambaNova Cloud","slug":"function-calling-json-mode-in-sambanova-cloud","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-06-15T05:43:12.630Z","last_posted_at":"2025-06-15T05:43:12.762Z","bumped":true,"bumped_at":"2025-06-15T05:43:12.762Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Overview:\nSambaNova Cloud supports advanced function-calling capabilities that enable structured, tool-augmented responses. This allows you to build more dynamic, context-aware applications that can interface directly wi&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":8,"name":"function_calling","slug":"function-calling"},{"id":38,"name":"cloud","slug":"cloud"}],"tags_descriptions":{},"views":40,"like_count":4,"has_summary":false,"last_poster_username":"saurabh.patil","category_id":83,"op_like_count":4,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":156,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"SambaNova Text Generation","id":1195,"title":"SambaNova Text Generation","slug":"sambanova-text-generation","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-06-15T05:23:40.654Z","last_posted_at":"2025-06-15T05:23:40.786Z","bumped":true,"bumped_at":"2025-06-15T05:23:40.786Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Overview:\nSambaNova Cloud offers advanced text generation capabilities via an OpenAI-compatible API interface. Supported modes include: \n\n:white_check_mark: Non-Streaming (standard)\n:counterclockwise_arrows_button: Strea&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":38,"name":"cloud","slug":"cloud"},{"id":50,"name":"text-generation","slug":"text-generation"}],"tags_descriptions":{},"views":34,"like_count":2,"has_summary":false,"last_poster_username":"saurabh.patil","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":156,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"How to create COE bundles in studio","id":1176,"title":"How to create COE bundles in studio","slug":"how-to-create-coe-bundles-in-studio","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://us1.discourse-cdn.com/sambanova/optimized/2X/0/0d2da3e30cf391e5014240b974b6535c3968ee63_2_1024x424.png","created_at":"2025-06-01T18:58:46.170Z","last_posted_at":"2025-06-01T18:58:46.327Z","bumped":true,"bumped_at":"2025-06-01T18:58:46.327Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Purpose:\nThe purpose of this page is to provide a step-by-step guide on creating COE bundles in Studio. COE bundles are pre-configured templates that enable organizations to standardize and accelerate their development p&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":48,"name":"sambanova-suite","slug":"sambanova-suite"},{"id":49,"name":"on-prem","slug":"on-prem"}],"tags_descriptions":{},"views":74,"like_count":0,"has_summary":false,"last_poster_username":"Rohit.Vyawahare","category_id":83,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":157,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Image Classification with SambaStudio","id":1171,"title":"Image Classification with SambaStudio","slug":"image-classification-with-sambastudio","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-05-30T09:38:09.244Z","last_posted_at":"2025-05-30T09:38:09.353Z","bumped":true,"bumped_at":"2025-05-30T13:52:05.580Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Overview:\nThis document explains how to perform image classification using the Vit_B_Classification model in SambaStudio. Image classification is the process of assigning labels to images from a set of predefined classes&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":48,"name":"sambanova-suite","slug":"sambanova-suite"},{"id":49,"name":"on-prem","slug":"on-prem"}],"tags_descriptions":{},"views":49,"like_count":1,"has_summary":false,"last_poster_username":"saurabh.patil","category_id":83,"op_like_count":1,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":156,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"All about Speculative Decoding","id":1172,"title":"All about Speculative Decoding","slug":"all-about-speculative-decoding","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://us1.discourse-cdn.com/sambanova/optimized/2X/4/409e3ea738afa8722bf667eb3b0d4e0bc74eacf2_2_1024x546.avif","created_at":"2025-05-30T09:52:36.478Z","last_posted_at":"2025-05-30T09:52:36.611Z","bumped":true,"bumped_at":"2025-05-30T09:52:36.611Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Speculative Decoding (SD) is a token generation acceleration technique where a faster, smaller draft model proposes future tokens, which are then validated by a larger, accurate target model. This approach significantly &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":58,"like_count":0,"has_summary":false,"last_poster_username":"prajwal.balapure","category_id":83,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":159,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Unlocking the Power of AI: A Deep Dive into Available Models on SambaNova Cloud","id":1170,"title":"Unlocking the Power of AI: A Deep Dive into Available Models on SambaNova Cloud","slug":"unlocking-the-power-of-ai-a-deep-dive-into-available-models-on-sambanova-cloud","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-05-30T07:33:48.258Z","last_posted_at":"2025-05-30T07:33:48.477Z","bumped":true,"bumped_at":"2025-05-30T07:33:48.477Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":":rocket: Overview:\nThe SambaNova Cloud is purpose-built to accelerate AI workloads powered by SambaNova RDUs, empowering enterprises to deploy, fine-tune, and scale cutting-edge models with ease. Whether you’re building &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":208,"like_count":0,"has_summary":false,"last_poster_username":"prafull.thokal","category_id":83,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":47,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Fundamentals of RAG (Retrieval-Augmented Generation)","id":1169,"title":"Fundamentals of RAG (Retrieval-Augmented Generation)","slug":"fundamentals-of-rag-retrieval-augmented-generation","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-05-30T06:57:46.518Z","last_posted_at":"2025-05-30T06:57:46.659Z","bumped":true,"bumped_at":"2025-05-30T06:57:46.659Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"What is RAG?\nRAG = Retrieval + Generation \nInstead of just generating answers from a fixed model, RAG: \n\nRetrieves relevant information (e.g., from documents, PDFs, or databases)\nAugments the user prompt with the retriev&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":51,"like_count":1,"has_summary":false,"last_poster_username":"shivani.moze","category_id":83,"op_like_count":1,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":161,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"PulseProbe – Your CLI Companion for Model Visibility on SambaNova Cloud","id":1164,"title":"PulseProbe – Your CLI Companion for Model Visibility on SambaNova Cloud","slug":"pulseprobe-your-cli-companion-for-model-visibility-on-sambanova-cloud","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-05-29T13:38:35.385Z","last_posted_at":"2025-05-29T13:38:35.596Z","bumped":true,"bumped_at":"2025-05-29T13:54:09.827Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":":books: Context\nModern AI applications often leverage multiple large language models (LLMs) deployed via cloud APIs like SambaNova Cloud. For seamless development and troubleshooting, it’s essential to maintain clear vis&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":73,"like_count":0,"has_summary":false,"last_poster_username":"prafull.thokal","category_id":83,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":47,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"SambaNova Support Phone Numbers","id":1139,"title":"SambaNova Support Phone Numbers","slug":"sambanova-support-phone-numbers","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-05-21T17:34:33.527Z","last_posted_at":"2025-05-21T17:34:33.623Z","bumped":true,"bumped_at":"2025-05-21T17:34:33.623Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"SambaNova Support Phone Numbers: \n\n\nUSA +1(888) 490-0590 \n\n\nHungary +3618088012 \n\n\nUK +44 800 368 5473 \n\n\nJapan +81 50-5785-0264 \n\n\nSweden +46 8 502 457 87","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":47,"name":"contact","slug":"contact"},{"id":13,"name":"support","slug":"support"}],"tags_descriptions":{},"views":54,"like_count":6,"has_summary":false,"last_poster_username":"Coby","category_id":83,"op_like_count":6,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":2,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Developing a Linux Command Generator using Sambanova&rsquo;s API","id":1108,"title":"Developing a Linux Command Generator using Sambanova's API","slug":"developing-a-linux-command-generator-using-sambanovas-api","posts_count":2,"reply_count":0,"highest_post_number":2,"image_url":null,"created_at":"2025-05-08T18:36:11.481Z","last_posted_at":"2025-05-09T07:37:02.962Z","bumped":true,"bumped_at":"2025-05-09T07:37:02.962Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Introduction \nThis guide walks you through creating a Linux Command Generator using Sambanova’s API, a tool that bridges the gap between human language and terminal expertise. \nNavigating Linux commands can be daunting, &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":68,"like_count":3,"has_summary":false,"last_poster_username":"shivani.moze","category_id":83,"op_like_count":2,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":null,"description":"Original Poster","user_id":158,"primary_group_id":null,"flair_group_id":45},{"extras":"latest","description":"Most Recent Poster","user_id":161,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Extracting chat completion ID ( request ID)","id":1095,"title":"Extracting chat completion ID ( request ID)","slug":"extracting-chat-completion-id-request-id","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-04-30T20:23:52.365Z","last_posted_at":"2025-04-30T20:23:52.466Z","bumped":true,"bumped_at":"2025-04-30T20:23:52.466Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Extracting Chat Completion ID\nIntroduction\nThe chat completion ID is a unique identifier generated by the OpenAI API for each chat completion request. \nExtracting the ID\nTo extract the chat completion ID, you can access &hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":27,"name":"inference","slug":"inference"},{"id":44,"name":"debugging","slug":"debugging"}],"tags_descriptions":{},"views":77,"like_count":0,"has_summary":false,"last_poster_username":"Coby","category_id":83,"op_like_count":0,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":2,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Behavior of &lt;think&gt; Tag in QwQ-32B Model Responses","id":1059,"title":"Behavior of <think> Tag in QwQ-32B Model Responses","slug":"behavior-of-think-tag-in-qwq-32b-model-responses","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2025-04-16T02:35:56.888Z","last_posted_at":"2025-04-16T02:35:56.989Z","bumped":true,"bumped_at":"2025-04-16T02:35:56.989Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Issue Summary: \nUsers may observe that responses from the QwQ-32B model (also referred to as the “thinking model”) contain a closing &lt;/think&gt; tag without a corresponding opening &lt;think&gt; tag. This may cause issues in pars&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":95,"like_count":4,"has_summary":false,"last_poster_username":"durgesh.ojha","category_id":83,"op_like_count":4,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":48,"primary_group_id":null,"flair_group_id":45}]},{"fancy_title":"Gradio compatibility","id":427,"title":"Gradio compatibility","slug":"gradio-compatibility","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":"https://us1.discourse-cdn.com/sambanova/original/1X/01f7e7088039049b6d5b54a2707785ba0018012c.png","created_at":"2024-10-09T03:07:10.421Z","last_posted_at":"2024-10-09T03:07:10.542Z","bumped":true,"bumped_at":"2025-02-19T22:20:50.268Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Gradio is the fastest way easily create machine learning applications with a user-friendly web interface powered by SambaNova’s Inference API. \nInstallation\npip install sambanova-gradio==0.1.0\n\nBasic Usage\nJust like if y&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[{"id":32,"name":"support-knowledge","slug":"support-knowledge"}],"tags_descriptions":{},"views":242,"like_count":7,"has_summary":false,"last_poster_username":"ankit.agrawal","category_id":83,"op_like_count":7,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":189,"primary_group_id":null,"flair_group_id":null}]},{"fancy_title":"Function Calling and JSON mode in SambaNova Cloud","id":540,"title":"Function Calling and JSON mode in SambaNova Cloud","slug":"function-calling-and-json-mode-in-sambanova-cloud","posts_count":1,"reply_count":0,"highest_post_number":1,"image_url":null,"created_at":"2024-11-07T05:01:28.650Z","last_posted_at":"2024-11-07T05:01:28.786Z","bumped":true,"bumped_at":"2025-02-19T22:20:21.700Z","archetype":"regular","unseen":false,"pinned":false,"unpinned":null,"excerpt":"Function Calling\nThe SN Cloud Function-Calling API enables dynamic workflows by allowing the model to select and suggest function calls based on user input, which can help you build agentic workflows. By defining a set o&hellip;","visible":true,"closed":false,"archived":false,"bookmarked":null,"liked":null,"tags":[],"tags_descriptions":{},"views":2026,"like_count":5,"has_summary":false,"last_poster_username":"ankit.agrawal","category_id":83,"op_like_count":5,"pinned_globally":false,"featured_link":null,"has_accepted_answer":false,"can_vote":false,"posters":[{"extras":"latest single","description":"Original Poster, Most Recent Poster","user_id":189,"primary_group_id":null,"flair_group_id":null}]}]}}