cpms_lang_detect.py 438 B

12345678910111213141516171819
  1. import re
  # Matches any single code point in the Unicode Cyrillic block
  # (U+0400-U+04FF). Compiled once at import time rather than on every call.
  _CYRILLIC_RE = re.compile(r'[\u0400-\u04FF]')


  def is_russian(text):
      """Return 1 if *text* contains at least one Cyrillic character, else 0.

      The check is script-based, not language-based: any character in the
      Unicode Cyrillic block (U+0400-U+04FF) counts, so text in other
      languages written in Cyrillic also yields 1.

      Args:
          text: The string to inspect.

      Returns:
          The integer 1 when a Cyrillic character is found, otherwise 0
          (including for the empty string).
      """
      return 1 if _CYRILLIC_RE.search(text) else 0
  # Characters treated as Spanish markers: n-tilde, the acute-accented
  # vowels (both cases) and the inverted punctuation marks.
  # NOTE(review): u-diaeresis is also used in Spanish but is left out because
  # it would additionally match German/Turkish text - confirm whether callers
  # want it included.
  _SPANISH_RE = re.compile(r'[ñÑáéíóúÁÉÍÓÚ¿¡]')


  def is_spanish(text):
      """Return 1 if *text* contains a Spanish-specific character, else 0.

      This is a character heuristic, not real language identification:
      accented vowels also occur in other languages, so such text yields 1
      as well, and Spanish text written without any of the marker
      characters yields 0.

      Args:
          text: The string to inspect.

      Returns:
          The integer 1 when one of the marker characters is found,
          otherwise 0 (including for the empty string).
      """
      return 1 if _SPANISH_RE.search(text) else 0