
| Current Path : /proc/thread-self/root/usr/local/lib/python3.8/dist-packages/silverware/htmltext/ |
Linux ift1.ift-informatik.de 5.4.0-216-generic #236-Ubuntu SMP Fri Apr 11 19:53:21 UTC 2025 x86_64 |
| Current File : //proc/thread-self/root/usr/local/lib/python3.8/dist-packages/silverware/htmltext/get_text.py |
from .get_raw_text import get_raw_text
from ..string import get_alphabetic
import re


def get_text(tag, remove_non_alphabetic=False):
	"""
	Return the whitespace-stripped raw text of ``tag``, or None when the
	text is filtered out.

	None is returned in two situations:

	* the stripped text matches the page-marker pattern ("Page" followed by
	  a space and one or more digits, and nothing else);
	* ``remove_non_alphabetic`` is truthy and ``get_alphabetic`` yields fewer
	  than two items for the stripped text.

	Note that, despite its name, ``remove_non_alphabetic`` never alters the
	returned text; it only decides whether the text is kept or dropped.

	:type tag: Tag
	:type remove_non_alphabetic: bool
	:rtype: NoneType or str
	"""
	stripped = get_raw_text(tag).strip()

	# Page markers such as "Page 12" carry no content, so they are discarded.
	if re.search(r'^\s*Page \d+$', stripped) is not None:
		return None

	# Optional filter: drop text with (presumably) fewer than two alphabetic
	# characters -- the exact result of get_alphabetic is defined elsewhere.
	if remove_non_alphabetic and len(get_alphabetic(stripped)) < 2:
		return None

	return stripped