Skip to content

Commit eadc04d

Browse files
committed
Avoid CV IDs in EF
1 parent 780cd06 commit eadc04d

File tree

1 file changed

+1
-1
lines changed

1 file changed

+1
-1
lines changed

backend/base/file_extraction.py

+1-1
Original file line numberDiff line numberDiff line change
@@ -23,7 +23,7 @@
2323

2424
# Regex fragment for a volume marker: a word boundary, then "v", "vol" or
# "volume", then an optional separator (". " or a single ".", "-" or
# whitespace character). The one capture group holds either a number with an
# optional dash-separated second number (e.g. "3" or "1-3"), or one to three
# "I" characters (roman numeral) that are not directly preceded by "v".
# NOTE(review): no flags are set here; case handling depends on how the
# snippet is compiled by its users -- confirm against the callers.
volume_regex_snippet = r'\b(?:v(?:ol|olume)?)(?:\.\s|[\.\-\s])?(\d+(?:\s?\-\s?\d+)?|(?<!v)I{1,3})'
2525
# Regex fragment for a year. It has five alternatives, each with its own
# capture group for the four-digit year, so exactly one of groups 1-5 is set
# on a match:
#   1. YYYY, optionally followed by up to two "-NN" parts (YYYY-NN-NN)
#   2. YYYY followed by a dash or whitespace, optionally with a second
#      four-digit number (e.g. "YYYY-YYYY" or "YYYY - YYYY")
#   3. one or two "NN-" parts followed by YYYY (e.g. "NN-NN-YYYY")
#   4. YYYY, one separator (whitespace, ".", "-" or "_"), then "Edition"
#   5. "YYYY-YYYY", exactly three whitespace characters, then four digits
# Alternative 1 succeeds on any four digits, so alternatives 2, 4 and 5 are
# only reached when the pattern surrounding this snippet forces backtracking.
year_regex_snippet = r'(?:(\d{4})(?:-\d{2}){0,2}|(\d{4})[\s\.]?[\-\s](?:[\s\.]?\d{4})?|(?:\d{2}-){1,2}(\d{4})|(\d{4})[\s\.\-_]Edition|(\d{4})\-\d{4}\s{3}\d{4})'
26-
# Version of the issue-number fragment on the removed ("-") side of this diff.
# The leading negative lookahead rejects digits followed by "th", "rd" or
# "st", or by optional whitespace plus "gb", "mb" or "kb". The negative
# lookbehind rejects a match that starts directly after an apostrophe.
# Accepted forms: digits, optionally followed by a 1-2 digit decimal part,
# by an optional "." plus an alphanumeric suffix, or by an optional separator
# plus a "½"/"¼" character; or a bare "½"/"¼". It has no capture groups.
issue_regex_snippet = r'(?!\d+(?:th|rd|st|\s?(?:gb|mb|kb)))(?<!\')(?:\d+(?:\.\d{1,2}|\.?[a-z0-9]+|[\s\-\._]?[½¼])?|[½¼])'
26+
# Regex fragment for an issue number; it has no capture groups.
# Guards applied at the position where the match starts:
#   - negative lookahead: rejects digits followed by "th", "rd" or "st", or by
#     optional whitespace plus "gb", "mb" or "kb"
#   - negative lookbehind: rejects a start directly after an apostrophe
#   - negative lookbehind: rejects a start directly after "cv" plus one
#     whitespace, "-" or "_" character (the commit title describes this as
#     avoiding CV IDs)
# Accepted forms: digits, optionally followed by a 1-2 digit decimal part,
# by an optional "." plus an alphanumeric suffix, or by an optional separator
# plus a "½"/"¼" character; or a bare "½"/"¼".
# NOTE(review): the ordinal list has no "nd" entry -- confirm whether
# that omission is intentional.
# NOTE(review): the lookbehinds only test the match start, so on their own
# they do not stop a search from matching at the second digit of a
# "cv"-prefixed number; this presumably relies on the surrounding pattern to
# anchor the start of the number -- verify against the callers.
issue_regex_snippet = r'(?!\d+(?:th|rd|st|\s?(?:gb|mb|kb)))(?<!\')(?<!cv[\s\-_])(?:\d+(?:\.\d{1,2}|\.?[a-z0-9]+|[\s\-\._]?[½¼])?|[½¼])'
2727

2828
# Cleaning the filename
2929
# Compiled pattern matching one bracketed segment, including its delimiters:
# "(...)", "[...]" or "{...}". Each alternative is non-greedy, so a match
# ends at the first closing delimiter of the same kind.
# NOTE(review): the pattern contains no cased letters, so IGNORECASE has no
# visible effect here.
strip_filename_regex = compile(r'\(.*?\)|\[.*?\]|\{.*?\}', IGNORECASE)

0 commit comments

Comments
 (0)