Merge branch 'jafioti:main' into feature-conv3d

This commit is contained in:
NewBornRustacean
2024-05-03 10:50:28 +09:00
committed by GitHub
3 changed files with 12 additions and 5 deletions

View File

@@ -12,6 +12,6 @@ Cargo.lock
# MSVC Windows builds of rustc generate these, which store debugging information
*.pdb
setup/*.gguf
setup/*.json
.vscode
.vscode
setup/tokenizer.json

View File

@@ -0,0 +1,7 @@
#!/usr/bin/env bash
# Downloads the Phi-3 tokenizer and GGUF model weights into the directory
# that contains this script, so it works no matter where it is invoked from.

# Stop at the first failing command, unset variable, or failed pipeline stage,
# so a broken download never ends with a misleading "Done!".
set -euo pipefail

# Absolute path of the directory holding this script.
SCRIPT_DIR=$( cd -- "$( dirname -- "${BASH_SOURCE[0]}" )" &> /dev/null && pwd )

echo "Downloading Model and Tokenizer..."
# --fail: exit non-zero on HTTP errors instead of saving the error page as the output file.
# The output paths are quoted so a checkout path containing spaces still works.
curl --fail --location https://luminal-public.s3.amazonaws.com/phi3/tokenizer.json --output "$SCRIPT_DIR/tokenizer.json"
curl --fail --location https://luminal-public.s3.amazonaws.com/phi3/phi3.gguf --output "$SCRIPT_DIR/phi3.gguf"
echo "Done!"

View File

@@ -55,9 +55,9 @@ fn main() {
// Set up model loading
#[cfg(any(feature = "metal", feature = "cuda"))]
let q_weights = loader::q8_load("setup/phi-3-mini-4k-instruct.Q8_0.gguf", &model, &mut cx);
let q_weights = loader::q8_load("setup/phi3.gguf", &model, &mut cx);
#[cfg(all(not(feature = "metal"), not(feature = "cuda")))]
loader::q8_load("setup/phi-3-mini-4k-instruct.Q8_0.gguf", &model, &mut cx);
loader::q8_load("setup/phi3.gguf", &model, &mut cx);
println!("\t\t - {}ms", now.elapsed().as_millis());
print!("Compiling graph");