Set ollama context length in example to 8192 to make it work (#252)
* set ollama context length in example
parent 58b18f5655
commit e30ec8ac91
@@ -89,8 +89,9 @@ from smolagents import CodeAgent, LiteLLMModel
 
 model = LiteLLMModel(
     model_id="ollama_chat/llama3.2", # This model is a bit weak for agentic behaviours though
-    api_base="http://localhost:11434", # replace with remote open-ai compatible server if necessary
-    api_key="YOUR_API_KEY" # replace with API key if necessary
+    api_base="http://localhost:11434", # replace with 127.0.0.1:11434 or remote open-ai compatible server if necessary
+    api_key="YOUR_API_KEY", # replace with API key if necessary
+    num_ctx=8192 # ollama default is 2048 which will fail horribly. 8192 works for easy tasks, more is better. Check https://huggingface.co/spaces/NyxKrage/LLM-Model-VRAM-Calculator to calculate how much VRAM this will need for the selected model.
 )
 
 agent = CodeAgent(tools=[], model=model, add_base_tools=True)
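For reference, a minimal sketch of the patched example in use. It assumes a local Ollama server with llama3.2 already pulled (ollama pull llama3.2); the run() prompt is only illustrative and not part of the commit.

from smolagents import CodeAgent, LiteLLMModel

model = LiteLLMModel(
    model_id="ollama_chat/llama3.2",   # a bit weak for agentic behaviours
    api_base="http://localhost:11434", # or a remote OpenAI-compatible server
    api_key="YOUR_API_KEY",            # only needed if the server enforces auth
    num_ctx=8192,                      # Ollama's 2048-token default truncates agent prompts
)

agent = CodeAgent(tools=[], model=model, add_base_tools=True)
agent.run("How many seconds are there in a leap year?")  # illustrative prompt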