model="Samantha-7B-GGML/Samantha-7B.ggmlv3.q4_0.bin" use_mmap="True" use_mlock="True" n_threads="10" n_ctx="2048" n_gpu_layers="35"