[extractor/common] Relax interaction count extraction in _json_ld
This commit is contained in:
		| @@ -68,6 +68,7 @@ from ..utils import ( | ||||
|     sanitized_Request, | ||||
|     sanitize_filename, | ||||
|     str_or_none, | ||||
|     str_to_int, | ||||
|     strip_or_none, | ||||
|     unescapeHTML, | ||||
|     unified_strdate, | ||||
| @@ -1248,7 +1249,10 @@ class InfoExtractor(object): | ||||
|                 interaction_type = is_e.get('interactionType') | ||||
|                 if not isinstance(interaction_type, compat_str): | ||||
|                     continue | ||||
|                 interaction_count = int_or_none(is_e.get('userInteractionCount')) | ||||
|                 # For the interaction count, some sites provide a string instead of | ||||
|                 # an integer (as the spec requires), containing non-digit characters | ||||
|                 # (e.g. ","), so extract the count with the more relaxed str_to_int. | ||||
|                 interaction_count = str_to_int(is_e.get('userInteractionCount')) | ||||
|                 if interaction_count is None: | ||||
|                     continue | ||||
|                 count_kind = INTERACTION_TYPE_MAP.get(interaction_type.split('/')[-1]) | ||||
|   | ||||
		Reference in New Issue
	
	Block a user
	 Sergey M․
					Sergey M․