import re
from typing import Any, Optional, Union
from wikibaseintegrator.datatypes.basedatatype import BaseDataType
[docs]
class Lexeme(BaseDataType):
"""
Implements the Wikibase data type 'wikibase-lexeme'
"""
DTYPE = 'wikibase-lexeme'
sparql_query = '''
SELECT * WHERE {{
?item_id <{wb_url}/prop/{pid}> ?s .
?s <{wb_url}/prop/statement/{pid}> <{wb_url}/entity/{value}> .
}}
'''
[docs]
def __init__(self, value: Optional[Union[str, int]] = None, **kwargs: Any):
"""
Constructor, calls the superclass BaseDataType
:param value: The lexeme number to serve as a value
"""
super().__init__(**kwargs)
self.set_value(value=value)
[docs]
def set_value(self, value: Optional[Union[str, int]] = None):
assert isinstance(value, (str, int)) or value is None, f"Expected str or int, found {type(value)} ({value})"
if value:
if isinstance(value, str):
pattern = re.compile(r'^(?:[a-zA-Z]+:|.+\/entity\/)?L?([0-9]+)$')
matches = pattern.match(value)
if not matches:
raise ValueError(f"Invalid lexeme ID ({value}), format must be 'L[0-9]+'")
value = int(matches.group(1))
self.mainsnak.datavalue = {
'value': {
'entity-type': 'lexeme',
'numeric-id': value,
'id': f'L{value}'
},
'type': 'wikibase-entityid'
}
[docs]
def get_sparql_value(self) -> str:
return self.mainsnak.datavalue['value']['id']