Skip to content

Commit c73196e

Browse files
authored
Merge pull request #26 from scuuy/main
Add three variants (API, CPU, and GPU) of the reasoning pipeline under statics; tested in a `dataflow init` folder.
2 parents f6711ff + 0f8a21e commit c73196e

File tree

3 files changed

+40
-16
lines changed

3 files changed

+40
-16
lines changed

dataflow/statics/pipelines/api_pipelines/reasoning_pipeline.py

Lines changed: 6 additions & 6 deletions
Original file line numberDiff line numberDiff line change
@@ -53,7 +53,7 @@ def __init__(self):
5353
llm_serving=llm_serving
5454
)
5555
########################## branch ############################
56-
self.answer_pipeline_root_step6 = AnswerPipelineRoot()
56+
# self.answer_pipeline_root_step6 = AnswerPipelineRoot()
5757
########################## answer ############################
5858
self.answer_generator_step7 = AnswerGenerator(
5959
llm_serving=llm_serving
@@ -103,11 +103,11 @@ def forward(self):
103103
output_key = "question_category"
104104
)
105105
############# branch #############
106-
self.answer_pipeline_root_step6.run(
107-
storage = self.storage.step(),
108-
input_answer_key = "output",
109-
input_gt_key = "golden_answer"
110-
)
106+
# self.answer_pipeline_root_step6.run(
107+
# storage = self.storage.step(),
108+
# input_answer_key = "output",
109+
# input_gt_key = "golden_answer"
110+
# )
111111
############## answer #############
112112
self.answer_generator_step7.run(
113113
storage = self.storage.step(),

dataflow/statics/pipelines/cpu_pipelines/reasoning_pipeline.py

Lines changed: 26 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -1,4 +1,8 @@
1-
from dataflow.operators.process.Reasoning import AnswerFormatterFilter
1+
from dataflow.operators.process.Reasoning import (
2+
AnswerFormatterFilter,
3+
AnswerGroundTruthFilter,
4+
AnswerNgramFilter,
5+
)
26
from dataflow.utils.storage import FileStorage
37

48
class ReasoningPipeline():
@@ -13,10 +17,30 @@ def __init__(self):
1317

1418
self.answer_format_filter_step1 = AnswerFormatterFilter()
1519

20+
self.answer_groundtruth_filter_step2 = AnswerGroundTruthFilter()
21+
22+
self.answer_ngram_filter_step3 = AnswerNgramFilter(
23+
min_score = 0.1,
24+
max_score = 1.0,
25+
ngrams = 5
26+
)
27+
1628
def forward(self):
1729
self.answer_format_filter_step1.run(
1830
storage = self.storage.step(),
19-
input_key = "generated_cot",
31+
input_key = "output",
32+
)
33+
34+
self.answer_groundtruth_filter_step2.run(
35+
storage = self.storage.step(),
36+
test_answer_key = "output",
37+
gt_answer_key = "golden_answer"
38+
)
39+
40+
self.answer_ngram_filter_step3.run(
41+
storage = self.storage.step(),
42+
question_key = "instruction",
43+
answer_key = "output"
2044
)
2145

2246
if __name__ == "__main__":

dataflow/statics/pipelines/gpu_pipelines/reasoning_pipeline.py

Lines changed: 8 additions & 8 deletions
Original file line numberDiff line numberDiff line change
@@ -27,8 +27,8 @@ def __init__(self):
2727
)
2828

2929
llm_serving = LocalModelLLMServing(
30-
model_name_or_path="Qwen2.5-7B-Instruct", # set to your own model path
31-
tensor_parallel_size=4,
30+
model_name_or_path="Qwen/Qwen2.5-7B-Instruct", # set to your own model path
31+
tensor_parallel_size=1,
3232
max_tokens=8192,
3333
model_source="local"
3434
)
@@ -52,7 +52,7 @@ def __init__(self):
5252
llm_serving=llm_serving
5353
)
5454
########################## branch ############################
55-
self.answer_pipeline_root_step6 = AnswerPipelineRoot()
55+
# self.answer_pipeline_root_step6 = AnswerPipelineRoot()
5656
########################## answer ############################
5757
self.answer_generator_step7 = AnswerGenerator(
5858
llm_serving=llm_serving
@@ -102,11 +102,11 @@ def forward(self):
102102
output_key = "question_category"
103103
)
104104
############# branch #############
105-
self.answer_pipeline_root_step6.run(
106-
storage = self.storage.step(),
107-
input_answer_key = "output",
108-
input_gt_key = "golden_answer"
109-
)
105+
# self.answer_pipeline_root_step6.run(
106+
# storage = self.storage.step(),
107+
# input_answer_key = "output",
108+
# input_gt_key = "golden_answer"
109+
# )
110110
############## answer #############
111111
self.answer_generator_step7.run(
112112
storage = self.storage.step(),

0 commit comments

Comments
 (0)