# dream
# 158 lines · 4.6 KB
# Service definitions for the document-based QA (transformers) distribution.
# Ports named in WAIT_HOSTS, in each `command`, and in each SERVICE_PORT build
# arg must stay in sync when any of them is changed.
services:
  # Agent: runs bin/wait first, then starts deeppavlov_agent with this
  # distribution's pipeline config.
  agent:
    command: sh -c 'bin/wait && python -m deeppavlov_agent.run agent.pipeline_config=assistant_dists/document_based_qa_transformers/pipeline_conf.json'
    environment:
      # Comma-separated host:port list (presumably consumed by bin/wait --
      # confirm). The lines below fold into one string joined by single
      # spaces. The `files` service is not listed here.
      WAIT_HOSTS: >-
        sentseg:8011,
        combined-classification:8087,
        ranking-based-response-selector:8002,
        sentence-ranker:8128,
        transformers-lm-mistral-7b-128k:8185,
        doc-retriever:8165,
        dff-document-qa-transformers-llm-skill:8186
      # Falls back to 1000 when WAIT_TIMEOUT is unset or empty.
      WAIT_HOSTS_TIMEOUT: ${WAIT_TIMEOUT:-1000}
      # Environment values are quoted so they are unambiguously strings.
      HIGH_PRIORITY_INTENTS: "1"
      RESTRICTION_FOR_SENSITIVE_CASE: "1"
      ALWAYS_TURN_ON_ALL_SKILLS: "0"
      LANGUAGE: EN

  # File upload/download server, run from a prebuilt image.
  files:
    image: julienmeerschart/simple-file-upload-download-server

  # Annotator built from ./annotators/SentSeg/ using Dockerfile-test;
  # Flask app on port 8011.
  sentseg:
    env_file: [.env]
    build:
      context: ./annotators/SentSeg/
      dockerfile: Dockerfile-test
    command: flask run -h 0.0.0.0 -p 8011
    environment:
      - FLASK_APP=server
    deploy:
      resources:
        limits:
          memory: 1.5G
        reservations:
          memory: 1.5G

  # Document retriever; Flask app on port 8165.
  doc-retriever:
    env_file: [.env]
    build:
      context: .
      dockerfile: ./annotators/doc_retriever/Dockerfile
      args:
        SERVICE_PORT: 8165
        SERVICE_NAME: doc_retriever
        CONFIG_PATH: ./doc_retriever_config.json
        # Comma-separated document URLs; must stay on one line with no
        # spaces so the value is passed through unchanged.
        DOC_PATH_OR_LINK: http://files.deeppavlov.ai/dream_data/documents_for_qa/test_file_dream_repo.html,http://files.deeppavlov.ai/dream_data/documents_for_qa/alphabet_financial_report.txt,http://files.deeppavlov.ai/dream_data/documents_for_qa/test_file_jurafsky_chatbots.pdf
        PARAGRAPHS_NUM: 5
        FILE_SERVER_TIMEOUT: 30
    command: python -m flask run -h 0.0.0.0 -p 8165
    environment:
      - FLASK_APP=server
      - CUDA_VISIBLE_DEVICES=0
    deploy:
      resources:
        limits:
          memory: 5G
        reservations:
          memory: 5G

  # Combined classifier annotator; gunicorn with a single worker on port 8087.
  combined-classification:
    env_file: [.env]
    build:
      args:
        CONFIG: combined_classifier.json
        SERVICE_PORT: 8087
      context: .
      dockerfile: ./annotators/combined_classification/Dockerfile
    command: gunicorn --workers=1 server:app -b 0.0.0.0:8087 --timeout 600
    environment:
      - CUDA_VISIBLE_DEVICES=0
    deploy:
      resources:
        limits:
          memory: 2G
        reservations:
          memory: 2G

  # Response selector; Flask app on port 8002. Its build args point it at the
  # sentence-ranker service defined below.
  ranking-based-response-selector:
    env_file: [.env]
    build:
      args:
        SERVICE_PORT: 8002
        SERVICE_NAME: response_selector
        LANGUAGE: EN
        SENTENCE_RANKER_ANNOTATION_NAME: sentence_ranker
        SENTENCE_RANKER_SERVICE_URL: http://sentence-ranker:8128/respond
        SENTENCE_RANKER_TIMEOUT: 3
        N_UTTERANCES_CONTEXT: 5
        FILTER_TOXIC_OR_BADLISTED: 1
      context: .
      dockerfile: ./response_selectors/ranking_based_response_selector/Dockerfile
    command: flask run -h 0.0.0.0 -p 8002
    environment:
      - FLASK_APP=server
    deploy:
      resources:
        limits:
          memory: 100M
        reservations:
          memory: 100M

  # Sentence ranker; Flask app on port 8128. No `dockerfile` key is set, so
  # the build uses the default Dockerfile inside the context directory.
  sentence-ranker:
    env_file: [.env]
    build:
      args:
        SERVICE_PORT: 8128
        SERVICE_NAME: sentence_ranker
        PRETRAINED_MODEL_NAME_OR_PATH: sentence-transformers/all-MiniLM-L6-v2
      context: ./services/sentence_ranker/
    command: flask run -h 0.0.0.0 -p 8128
    environment:
      - CUDA_VISIBLE_DEVICES=0
      - FLASK_APP=server
    deploy:
      resources:
        limits:
          memory: 3G
        reservations:
          memory: 3G

  # Generative LM service; Flask app on port 8185. Has the largest memory
  # budget in this file (50G).
  transformers-lm-mistral-7b-128k:
    env_file: [.env]
    build:
      args:
        SERVICE_PORT: 8185
        SERVICE_NAME: transformers_lm_mistral_7b_128k
        PRETRAINED_MODEL_NAME_OR_PATH: NousResearch/Yarn-Mistral-7b-128k
        HALF_PRECISION: 1
        USE_FLASH_ATTENTION_2: 1
      context: .
      dockerfile: ./services/transformers_lm/Dockerfile
    command: flask run -h 0.0.0.0 -p 8185
    environment:
      - CUDA_VISIBLE_DEVICES=0
      - FLASK_APP=server
    deploy:
      resources:
        limits:
          memory: 50G
        reservations:
          memory: 50G

  # Document-QA skill. GENERATIVE_SERVICE_URL targets the
  # transformers-lm-mistral-7b-128k service above. No `command` key is set
  # here, so the image's own default command applies.
  dff-document-qa-transformers-llm-skill:
    env_file: [.env]
    build:
      args:
        SERVICE_PORT: 8186
        SERVICE_NAME: dff_document_qa_llm_skill
        GENERATIVE_SERVICE_URL: http://transformers-lm-mistral-7b-128k:8185/respond
        GENERATIVE_SERVICE_CONFIG: transformers_mistral.json
        GENERATIVE_TIMEOUT: 120
        N_UTTERANCES_CONTEXT: 7
        FILE_SERVER_TIMEOUT: 30
        DOCUMENT_PROMPT_FILE: common/prompts/document_qa_instruction.json
      context: .
      dockerfile: ./skills/dff_document_qa_llm_skill/Dockerfile
    deploy:
      resources:
        limits:
          memory: 128M
        reservations:
          memory: 128M

# Compose file format version; kept quoted so it is read as a string.
version: '3.7'