Skip to content

Commit

Permalink
default context size increased to 2048
Browse files Browse the repository at this point in the history
  • Loading branch information
mgonzs13 committed Dec 12, 2023
1 parent 693f616 commit 9ddeef2
Show file tree
Hide file tree
Showing 5 changed files with 10 additions and 10 deletions.
4 changes: 2 additions & 2 deletions README.md
Original file line number Diff line number Diff line change
Expand Up @@ -33,11 +33,11 @@ def generate_launch_description():

return LaunchDescription([
create_llama_launch(
- n_ctx=512, # context of the LLM in tokens
+ n_ctx=2048, # context of the LLM in tokens
n_batch=8, # batch size in tokens
n_gpu_layers=0, # layers to load in GPU
n_threads=4, # threads
- n_predict=512, # max tokens (prompt tokens + predicted tokens
+ n_predict=2048, # max tokens (prompt tokens + predicted tokens). -1 == inf

model_repo="TheBloke/Marcoroni-7B-v3-GGUF", # Hugging Face repo
model_filename="marcoroni-7b-v3.Q4_K_M.gguf", # model file
Expand Down
4 changes: 2 additions & 2 deletions llama_bringup/launch/cybertron.launch.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,11 +29,11 @@ def generate_launch_description():

return LaunchDescription([
create_llama_launch(
- n_ctx=512,
+ n_ctx=2048,
n_batch=8,
n_gpu_layers=0,
n_threads=4,
- n_predict=512,
+ n_predict=2048,

model_repo="TheBloke/MetaMath-Cybertron-Starling-GGUF",
model_filename="metamath-cybertron-starling.Q4_K_M.gguf",
Expand Down
4 changes: 2 additions & 2 deletions llama_bringup/launch/hermes.launch.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,11 +29,11 @@ def generate_launch_description():

return LaunchDescription([
create_llama_launch(
- n_ctx=512,
+ n_ctx=2048,
n_batch=8,
n_gpu_layers=0,
n_threads=4,
- n_predict=512,
+ n_predict=2048,

model_repo="TheBloke/OpenHermes-2.5-neural-chat-v3-3-Slerp-GGUF",
model_filename="openhermes-2.5-neural-chat-v3-3-slerp.Q4_K_M.gguf",
Expand Down
4 changes: 2 additions & 2 deletions llama_bringup/launch/marcoroni.launch.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,11 +29,11 @@ def generate_launch_description():

return LaunchDescription([
create_llama_launch(
- n_ctx=512,
+ n_ctx=2048,
n_batch=8,
n_gpu_layers=0,
n_threads=4,
- n_predict=512,
+ n_predict=2048,

model_repo="TheBloke/Marcoroni-7B-v3-GGUF",
model_filename="marcoroni-7b-v3.Q4_K_M.gguf",
Expand Down
4 changes: 2 additions & 2 deletions llama_bringup/launch/neural-chat.launch.py
Original file line number Diff line number Diff line change
Expand Up @@ -29,11 +29,11 @@ def generate_launch_description():

return LaunchDescription([
create_llama_launch(
- n_ctx=512,
+ n_ctx=2048,
n_batch=8,
n_gpu_layers=0,
n_threads=4,
- n_predict=512,
+ n_predict=2048,

model_repo="janhq/neural-chat-7b-v3-3-slerp-GGUF",
model_filename="neural-chat-7b-v3-3-slerp.Q4_K_M.gguf",
Expand Down

0 comments on commit 9ddeef2

Please sign in to comment.