File tree 2 files changed +16
-2
lines changed
slm/applications/neural_search/recall/milvus
2 files changed +16
-2
lines changed Original file line number Diff line number Diff line change 91
91
92
92
```
93
93
94
+ 下载数据集并解压到当前目录:
95
+ ``` shell
96
+ wget https://bj.bcebos.com/v1/paddlenlp/data/literature_search_data.zip
97
+ unzip literature_search_data.zip
98
+ ```
99
+
94
100
<a name="向量检索"></a>
95
101
96
102
## 5. 向量检索
@@ -141,6 +147,10 @@ python milvus_ann_search.py --data_path milvus/milvus_data.csv \
141
147
* `search`: 是否检索向量
142
148
* `batch_size`: 表示一次性插入的向量数量
143
149
150
+ 也可以运行脚本:
151
+ ```shell
152
+ sh scripts/feature_extract.sh
153
+ ```
144
154
145
155
| 数据量 | 时间 |
146
156
| ------------ | ------------ |
Original file line number Diff line number Diff line change 23
23
24
24
from paddlenlp .data import Pad , Tuple
25
25
from paddlenlp .transformers import AutoTokenizer
26
+ from paddlenlp .utils .env import (
27
+ PADDLE_INFERENCE_MODEL_SUFFIX ,
28
+ PADDLE_INFERENCE_WEIGHTS_SUFFIX ,
29
+ )
26
30
27
31
sys .path .append ("." )
28
32
@@ -59,8 +63,8 @@ def __init__(
59
63
self .max_seq_length = max_seq_length
60
64
self .batch_size = batch_size
61
65
62
- model_file = model_dir + "/inference.get_pooled_embedding.pdmodel "
63
- params_file = model_dir + "/inference.get_pooled_embedding.pdiparams "
66
+ model_file = model_dir + f "/inference.get_pooled_embedding{ PADDLE_INFERENCE_MODEL_SUFFIX } "
67
+ params_file = model_dir + f "/inference.get_pooled_embedding{ PADDLE_INFERENCE_WEIGHTS_SUFFIX } "
64
68
if not os .path .exists (model_file ):
65
69
raise ValueError ("not find model file path {}" .format (model_file ))
66
70
if not os .path .exists (params_file ):
You can’t perform that action at this time.
0 commit comments