Skip to content

Commit

Permalink
parse oracle file name from <code>xx</code>
Browse files Browse the repository at this point in the history
  • Loading branch information
stellaHSR committed Mar 19, 2024
1 parent 631a264 commit 740c963
Showing 1 changed file with 27 additions and 0 deletions.
27 changes: 27 additions & 0 deletions data/inference/make_datasets/parse_utils.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,27 @@
import re


def extract_scripts_from_codetext(codetext: str):
    """Collect the Python file paths named by ``[start of <path>.py]`` markers.

    The input may contain several file sections, for example::

        [end of README.rst]
        [start of sklearn/compose/_target.py]
        ... file content ...
        [end of sklearn/compose/_target.py]
        [start of another_module/example.py]
        ... file content ...
        [end of another_module/example.py]

    Only ``start`` markers whose path ends in ``.py`` are reported; ``end``
    markers and markers for other file types are ignored. Every path found
    (or a notice when none is found) is also printed to standard output.

    Args:
        codetext: Text to scan for section markers.

    Returns:
        A new list with the matched paths in order of appearance. Duplicates
        are kept. The list is empty when no marker matches.
    """
    # A marker occupies a single line, so the captured path must not contain
    # a line break. Excluding "\r" and "\n" keeps an unterminated
    # "[start of ..." from swallowing the following lines up to a later
    # "....py]" and being reported as a bogus multi-line file name.
    script_names = re.findall(r"\[start of ([^\]\r\n]+\.py)\]", codetext)

    if not script_names:
        print("No script names found in the text.")
        return script_names

    # Report every extracted file name.
    for script_name in script_names:
        print("Extracted script name:", script_name)
    return script_names

0 comments on commit 740c963

Please sign in to comment.