kgdata.wikipedia.models.html_article#

Classes

AdditionalEntity(identifier, url, aspects)

HTMLArticle(name, page_id, date_modified, ...)

Model of an HTML article page from the Wikipedia HTML dumps.

NameAndURL(name, url)

class HTMLArticle(name: str, page_id: int, date_modified: str, url: str, lang: str, wdentity: Optional[str], additional_entities: List[AdditionalEntity], is_part_of: str, categories: List[NameAndURL], templates: List[NameAndURL], redirects: List[NameAndURL], html: str, wikitext: str)[source]#

Bases: object

Model of an HTML article page from the Wikipedia HTML dumps.

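Parameters:
  • name (str) –

  • page_id (int) –

  • date_modified (str) –

  • url (str) –

  • lang (str) –

  • wdentity (Optional[str]) –

  • additional_entities (List[AdditionalEntity]) –

  • is_part_of (str) –

  • categories (List[NameAndURL]) –

  • templates (List[NameAndURL]) –

  • redirects (List[NameAndURL]) –

  • html (str) –

  • wikitext (str) –
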
name: str#
page_id: int#
date_modified: str#
url: str#
lang: str#
wdentity: Optional[str]#
additional_entities: List[AdditionalEntity]#
is_part_of: str#
categories: List[NameAndURL]#
templates: List[NameAndURL]#
redirects: List[NameAndURL]#
html: str#
wikitext: str#
static from_dump_dict(o: dict) → HTMLArticle[source]#
Parameters:

o (dict) –

Return type:

HTMLArticle

to_dict() → dict[source]#
Return type:

dict

class AdditionalEntity(identifier: str, url: str, aspects: List[str])[source]#

Bases: object

Parameters:
  • identifier (str) –

  • url (str) –

  • aspects (List[str]) –

identifier: str#
url: str#
aspects: List[str]#
to_dict() → dict[source]#
Return type:

dict

class NameAndURL(name: str, url: str)[source]#

Bases: object

Parameters:
  • name (str) –

  • url (str) –

name: str#
url: str#
to_dict() → dict[source]#
Return type:

dict