Spaces:

katanaml
/

sparrow-ml

Running

App Files Files Community

sparrow-ml / config.yml

katanaml

Added sparrow key support

dca3ac6 10 months ago

raw

history blame contribute delete

3.26 kB

	# Global boolean switch, written in canonical lowercase so every YAML loader
	# (1.1 and 1.2) reads it as a boolean.
	# NOTE(review): presumably turns on key-protected access — confirm against the
	# code that reads this setting.
	PROTECTED_ACCESS: true

	# === AGENT FOR LLAMAINDEX ===
	# Ollama base URL in use; the commented entry is an alternative host.
	OLLAMA_BASE_URL: 'http://127.0.0.1:11434'
	# OLLAMA_BASE_URL: 'http://192.168.68.107:11434'
	# Active model, followed by the other models this agent was tested with.
	LLM: 'adrienbrault/nous-hermes2theta-llama3-8b:q5_K_M'
	# LLM: 'starling-lm:7b-alpha-q4_K_M'
	# LLM: 'starling-lm:7b-alpha-q5_K_M'
	# LLM: 'llama3:8b-instruct-q5_K_M'
	# Embedding model identifier and chunk size.
	EMBEDDINGS: 'sentence-transformers/all-mpnet-base-v2'
	CHUNK_SIZE: 3000
	# Weaviate URL.
	WEAVIATE_URL: 'http://localhost:8080'


	# === AGENT FOR HAYSTACK ===
	# Ollama base URL in use; the commented entry is an alternative host.
	OLLAMA_BASE_URL_HAYSTACK: 'http://127.0.0.1:11434'
	# OLLAMA_BASE_URL_HAYSTACK: 'http://192.168.68.107:11434'
	# Active model, followed by the other models this agent was tested with.
	LLM_HAYSTACK: 'adrienbrault/nous-hermes2theta-llama3-8b:q5_K_M'
	# LLM_HAYSTACK: 'starling-lm:7b-alpha-q4_K_M'
	# LLM_HAYSTACK: 'starling-lm:7b-alpha-q5_K_M'
	# LLM_HAYSTACK: 'llama3:8b-instruct-q5_K_M'
	MAX_LOOPS_ALLOWED_HAYSTACK: 3
	# Embedding model identifier.
	EMBEDDINGS_HAYSTACK: 'sentence-transformers/all-MiniLM-L6-v2'
	# Splitting settings: unit to split by, split length, and overlap.
	SPLIT_BY_HAYSTACK: 'sentence'
	SPLIT_LENGTH_HAYSTACK: 3000
	SPLIT_OVERLAP_HAYSTACK: 100


	# AGENT FOR VLLAMAINDEX
	# Model configured for this agent; it is the one the agent was tested with.
	LLM_VLLAMAINDEX: 'llava:13b'


	# === AGENT FOR VPROCESSOR ===
	OLLAMA_BASE_URL_VPROCESSOR: 'http://127.0.0.1:11434'
	# Active model, followed by the other models this agent was tested with.
	LLM_VPROCESSOR: 'llama3:8b-instruct-q5_K_M'
	# LLM_VPROCESSOR: 'starling-lm:7b-alpha-q5_K_M'
	# LLM_VPROCESSOR: 'adrienbrault/nous-hermes2pro:Q5_K_M-json'
	# URL of the OCR inference endpoint.
	OCR_ENDPOINT_VPROCESSOR: 'http://127.0.0.1:8001/api/v1/sparrow-ocr/inference'


	# === AGENT FOR FUNCTION CALL ===
	# Model this agent was tested with.
	LLM_FUNCTION: 'adrienbrault/nous-hermes2theta-llama3-8b:q5_K_M'
	# Base URL for this agent; note that it includes the /v1 path suffix.
	OLLAMA_BASE_URL_FUNCTION: 'http://127.0.0.1:11434/v1'


	# === AGENT FOR UNSTRUCTURED LIGHT ===
	BASE_URL_UNSTRUCTURED_LIGHT: 'http://127.0.0.1:11434'
	# Model this agent was tested with.
	LLM_UNSTRUCTURED_LIGHT: 'adrienbrault/nous-hermes2pro:Q5_K_M-json'
	# Embedding model; fetch it first with: ollama pull nomic-embed-text
	EMBEDDINGS_UNSTRUCTURED_LIGHT: 'nomic-embed-text'
	# How PDFs are analyzed and table structure is extracted.
	STRATEGY_UNSTRUCTURED_LIGHT: 'hi_res'
	# Best model for table extraction. Depending on file layout,
	# detectron2_onnx and chipper are the other options.
	MODEL_UNSTRUCTURED_LIGHT: 'yolox'
	# Chunk size and overlap.
	CHUNK_SIZE_UNSTRUCTURED_LIGHT: 1000
	OVERLAP_UNSTRUCTURED_LIGHT: 200


	# === AGENT FOR UNSTRUCTURED ===
	BASE_URL_UNSTRUCTURED: 'http://127.0.0.1:11434'
	# Model this agent was tested with.
	LLM_UNSTRUCTURED: 'adrienbrault/nous-hermes2pro:Q5_K_M-json'
	# Embedding model identifier and the device setting.
	EMBEDDINGS_UNSTRUCTURED: 'all-MiniLM-L6-v2'
	DEVICE_UNSTRUCTURED: 'cpu'
	# Weaviate URL.
	WEAVIATE_URL_UNSTRUCTURED: 'http://localhost:8080'
	# Input and output directories (relative paths).
	INPUT_DIR_UNSTRUCTURED: 'data/pdf'
	OUTPUT_DIR_UNSTRUCTURED: 'data/json'
	# Character-count chunking thresholds.
	CHUNK_UNDER_N_CHARS_UNSTRUCTURED: 250
	CHUNK_NEW_AFTER_N_CHARS_UNSTRUCTURED: 500


	# AGENT FOR INSTRUCTOR
	# Base URL for this agent (includes the /v1 path suffix); the commented entry
	# is an alternative host.
	OLLAMA_BASE_URL_INSTRUCTOR: 'http://127.0.0.1:11434/v1'
	# OLLAMA_BASE_URL_INSTRUCTOR: 'http://192.168.68.107:11434/v1'
	# Active model, followed by the other models this agent was tested with.
	LLM_INSTRUCTOR: 'adrienbrault/nous-hermes2theta-llama3-8b:q5_K_M'
	# LLM_INSTRUCTOR: 'adrienbrault/nous-hermes2pro:Q5_K_M-json'
	# LLM_INSTRUCTOR: 'wizardlm2:7b-q5_K_M'
	# Strategy for analyzing PDFs and extracting table structure.
	STRATEGY_INSTRUCTOR: 'hi_res'
	# yolox is the default model; detectron2_onnx is the other option, depending
	# on file layout.
	MODEL_INSTRUCTOR: 'yolox'
	# Similarity thresholds for junk columns and for the column id.
	# NOTE(review): how these are compared is not visible here — confirm in the
	# agent code before tuning.
	SIMILARITY_THRESHOLD_JUNK_COLUMNS_INSTRUCTOR: 0.5
	SIMILARITY_THRESHOLD_COLUMN_ID_INSTRUCTOR: 0.3
	# Empty string by default; single-quoted like every other string in this file.
	PDF_SPLIT_OUTPUT_DIR_INSTRUCTOR: ''
	# Canonical lowercase boolean so YAML 1.1 and 1.2 loaders agree on the type.
	PDF_CONVERT_TO_IMAGES_INSTRUCTOR: false