Skip to content

Navigation Menu

Sign in
Appearance settings

Search code, repositories, users, issues, pull requests...

Provide feedback

We read every piece of feedback, and take your input very seriously.

Saved searches

Use saved searches to filter your results more quickly

Sign up
Appearance settings

Commit f72c21d

Browse files
Changed model
1 parent 59fcac7 commit f72c21d

File tree

2 files changed

+20
-15
lines changed

2 files changed

+20
-15
lines changed

‎RagDemo.java‎

Lines changed: 19 additions & 14 deletions
Original file line numberDiff line numberDiff line change
@@ -14,18 +14,14 @@
1414
public class RagDemo {
1515

1616
static {
17-
Unirest.config().socketTimeout(120000).connectTimeout(120000);
17+
Unirest.config().socketTimeout(5 * 60 * 1000);
1818
}
1919

2020
public static void main(String[] args) throws Exception {
2121
var input = System.console().readLine("I'm looking for: ");
2222

23-
System.out.println("\nFinding closest products...");
23+
System.out.println("Finding closest products...");
2424
var context = getContext(input);
25-
System.out.println("-------------------------------------------------------------");
26-
System.out.println(context);
27-
System.out.println("-------------------------------------------------------------\n");
28-
2925
System.out.println("Generating response...");
3026
var prompt = buildPrompt(input, context);
3127
var response = getResponse(prompt);
@@ -34,10 +30,13 @@ public static void main(String[] args) throws Exception {
3430

3531
private static String getContext(String input) throws Exception {
3632
var requestBody = """
37-
{ "model": "bert-cpp-minilm-v6", "input": %s }
33+
{
34+
"model": "bert-cpp-minilm-v6",
35+
"input": %s
36+
}
3837
""".formatted(new ObjectMapper().writeValueAsString(input));
3938

40-
var response = Unirest.post("http://localhost:8080/v1/embeddings")
39+
var response = Unirest.post("http://127.0.0.1:8080/v1/embeddings")
4140
.header("Content-Type", "application/json")
4241
.body(requestBody)
4342
.asString().getBody();
@@ -53,7 +52,7 @@ SELECT id, CONCAT(
5352
FROM products
5453
WHERE embedding IS NOT NULL
5554
ORDER BY VEC_Distance(embedding, VEC_FromText(JSON_EXTRACT(:response, '$.data[0].embedding')))
56-
LIMIT 10
55+
LIMIT 7
5756
""")
5857
.addParameter("response", response)
5958
.executeAndFetchTable();
@@ -66,20 +65,26 @@ ORDER BY VEC_Distance(embedding, VEC_FromText(JSON_EXTRACT(:response, '$.data[0]
6665

6766
private static String buildPrompt(String input, Object context) {
6867
return """
69-
You are a sales assistant. I'm looking for %s.
70-
71-
Using the following information, recommend me a product in one single paragraph:
68+
I'm looking for %s. Using the following information, recommend me a product in one single paragraph:
7269
7370
%s
7471
""".formatted(input, context);
7572
}
7673

7774
private static String getResponse(String prompt) throws Exception {
7875
var requestBody = """
79-
{ "model": "phi-2", "messages": [{"role": "user", "content": %s, "temperature": 0.4}] }
76+
{
77+
"model": "phi-2-chat",
78+
"messages": [
79+
{"role": "system", "content": "You are a sales assistant."},
80+
{"role": "user", "content": %s}
81+
],
82+
"temperature": 0.2,
83+
"max_tokens": 100
84+
}
8085
""".formatted(new ObjectMapper().writeValueAsString(prompt));
8186

82-
var response = Unirest.post("http://localhost:8080/v1/chat/completions")
87+
var response = Unirest.post("http://127.0.0.1:8080/v1/chat/completions")
8388
.header("Content-Type", "application/json")
8489
.body(requestBody)
8590
.asString().getBody();

‎docker-compose.yml‎

Lines changed: 1 addition & 1 deletion
Original file line numberDiff line numberDiff line change
@@ -14,7 +14,7 @@ services:
1414
local-ai:
1515
image: localai/localai:master-ffmpeg-core
1616
container_name: local-ai
17-
command: bert-cpp phi-3.5-mini-instruct
17+
command: bert-cpp phi-2-chat
1818
ports:
1919
- "8080:8080"
2020
environment:

0 commit comments

Comments
(0)

AltStyle によって変換されたページ (->オリジナル) /