# Usage examples for quick_llama(). The `if (FALSE)` guard means none of the
# calls below are evaluated when this file is run.
if (FALSE) {
  # Minimal call that relies on the default settings (deterministic)
  response <- quick_llama("Hello, how are you?")

  # Plain text completion: auto_format = FALSE skips the chat template
  raw_response <- quick_llama(
    "Complete this: The capital of France is",
    auto_format = FALSE
  )

  # Supply a custom system prompt
  code_response <- quick_llama(
    "Write a Python hello world program",
    system_prompt = "You are a Python programming expert."
  )

  # More creative output: raise the temperature and cap the response length
  creative_response <- quick_llama(
    "Tell me a story",
    temperature = 0.8,
    max_tokens = 200
  )

  # Discourage repetition via the repeat window and repeat penalty
  no_repeat <- quick_llama(
    "Explain AI",
    repeat_last_n = 64,
    penalty_repeat = 1.1
  )

  # Several prompts in one call (parallel processing)
  responses <- quick_llama(
    c("Summarize AI", "Explain quantum computing"),
    max_tokens = 150
  )
}
# Run the code above in your browser using DataLab