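All datasets contain JSON files in the so-called JSON Lines format, i.e., with one JSON object per line. The objects themselves look similar to this example (pretty-printed here for readability; in the actual files, each object occupies a single line):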
{
"similarityFirst":0.19148936170212766,
"pageTitle":"Arctic Monkeys",
"validFrom":"2019-07-13T19:05:09Z",
"pageID":1720451,
"content":[
"[[Alex Turner (musician)|Alex Turner]] – lead vocals, keyboards and synthesizers, rhythm and occasional lead guitar, piano (2002–present)",
"[[Matt Helders]] – drums, backing and lead vocals (2002–present)",
"[[Jamie Cook]] – lead and occasional rhythm guitar (2002–present); occasional keyboards (2018–present); backing vocals (2002–2006)",
"[[Nick O\u0027Malley]] – bass, backing vocals (2006–present)"
],
"contentHash":-354743718,
"itemCount":4,
"revisionId":906116756,
"similarityLast":1.0,
"contextType":"UPDATE",
"headings":"Band members",
"comment":"Reverted edits by [[Special:Contribs/104.176.172.183|104.176.172.183]] ([[User talk:104.176.172.183|talk]]) to last version by Robvanvee",
"position":1,
"user":{
"username":"C.Fred",
"id":461300
},
"contentType":"UNMODIFIED",
"key":"19239717-0",
"validTo":"2019-08-24T07:08:05Z"
}