mNo edit summary |
(Update package: OSW Core) Tag: Reverted |
||
(7 intermediate revisions by 2 users not shown) | |||
Line 1: | Line 1: | ||
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSW7d7193567ea14e4e89b74de88983b718", slot="jsondata"}).json, debug=true, mode="header"})) | |||
local lustache = require("Module:Lustache") | local lustache = require("Module:Lustache") | ||
Line 5: | Line 7: | ||
p.keys = { --jsonschema / json-ld keys | p.keys = { --jsonschema / json-ld keys | ||
category='type', | category='type', | ||
category_pseudoproperty='Category', -- Property:Category | |||
subcategory='subclass_of', | subcategory='subclass_of', | ||
schema_type='schema_type', | schema_type='schema_type', | ||
Line 20: | Line 23: | ||
} | } | ||
p.slots = { --slot names | p.slots = { --slot names | ||
main='main', | |||
jsondata='jsondata', | jsondata='jsondata', | ||
jsonschema='jsonschema', | jsonschema='jsonschema', | ||
Line 31: | Line 35: | ||
query='query' | query='query' | ||
} | } | ||
p.cache = {} | |||
--loads json from a wiki page | --loads json from a wiki page | ||
Line 37: | Line 43: | ||
function p.loadJson(args) | function p.loadJson(args) | ||
local page_title = p.defaultArg(args.title, "JsonSchema:Entity") --for testing | local page_title = p.defaultArg(args.title, "JsonSchema:Entity") --for testing | ||
local slot = p.defaultArg(args.slot, | local slot = p.defaultArg(args.slot, 'main') | ||
local debug = p.defaultArg(args.debug, nil) | local debug = p.defaultArg(args.debug, nil) | ||
local msg = "" | local msg = "" | ||
Line 43: | Line 49: | ||
local json = {} | local json = {} | ||
if (slot == | if p.cache[page_title] ~= nil then | ||
if p.cache[page_title][slot] ~= nil then | |||
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " of page " .. page_title .. " from cache <br>" end | |||
json = p.cache[page_title][slot] | |||
return {json=json, debug_msg=msg} | |||
end | |||
else p.cache[page_title] = {} | |||
end | |||
if (slot == 'main') then | |||
--json = mw.loadJsonData( "JsonSchema:Entity" ) --requires MediaWiki 1.39 | --json = mw.loadJsonData( "JsonSchema:Entity" ) --requires MediaWiki 1.39 | ||
local page = mw.title.makeTitle(p.splitString(page_title, ':')[1], p.splitString(page_title, ':')[2]) | local page = mw.title.makeTitle(p.splitString(page_title, ':')[1], p.splitString(page_title, ':')[2]) | ||
Line 49: | Line 64: | ||
if (text ~= nil) then json = mw.text.jsonDecode(text) end | if (text ~= nil) then json = mw.text.jsonDecode(text) end | ||
else | else | ||
if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " | if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsondata .. " of page " .. page_title .. "<br>" end | ||
local text = mw.slots.slotContent( slot , page_title ) | local text = mw.slots.slotContent( slot , page_title ) | ||
if (text ~= nil) then json = mw.text.jsonDecode(text) end | if (text ~= nil) then json = mw.text.jsonDecode(text) end | ||
Line 55: | Line 70: | ||
--mw.logObject(json) | --mw.logObject(json) | ||
p.cache[page_title][slot] = json | |||
return {json=json, debug_msg=msg} | return {json=json, debug_msg=msg} | ||
end | end | ||
-- test: mw.logObject(p.walkJsonSchema({jsonschema=p.loadJson({title="Category:Hardware", slot="jsonschema"}).json, debug=true}).jsonschema) | -- test: mw.logObject(p.walkJsonSchema({jsonschema=p.loadJson({title="Category:Hardware", slot="jsonschema"}).json, debug=true}).jsonschema) | ||
Line 105: | Line 122: | ||
end | end | ||
if (root) then | if (root) then | ||
for i, category in ipairs(visited) do | for i, category in ipairs(visited) do | ||
jsonschema = p.tableMerge(jsonschema, jsonschemas[category]) | --merge all schemas. we need to make a copy here, otherwise jsonschemas["Category:Entity"] contains the merged schema | ||
jsonschema = p.copy(p.tableMerge(jsonschema, jsonschemas[category])) | |||
end | end | ||
end | end | ||
Line 149: | Line 166: | ||
-- mustache can handle objects and arrays, so we can parse it directly | -- mustache can handle objects and arrays, so we can parse it directly | ||
-- todo: handle nested templates | -- todo: handle nested templates | ||
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( | local template_param = {[k]=v} | ||
jsondata[k] = lustache:render(eval_template.value, { | if (eval_template.root_key == false) then template_param = v end | ||
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( template_param ) .. "\n<br>" end | |||
jsondata[k] = lustache:render(eval_template.value, template_param, p.tableMerge({self=eval_template.value}, eval_template.partials)) -- render with self as registered partial for recursion | |||
if (eval_template.type == "mustache-wikitext") then | if (eval_template.type == "mustache-wikitext") then | ||
jsondata[k] = frame:preprocess( jsondata[k] ) | jsondata[k] = frame:preprocess( jsondata[k] ) | ||
Line 185: | Line 204: | ||
end | end | ||
else | else | ||
if (eval_template ~= nil and eval_template | if (eval_template ~= nil and eval_template.value ~= nil) then | ||
--evaluate single array item string as json {"self": "<value>", ".": "<value>"} | |||
--evaluate single array item string as json {"self": "<value>", ".": "<value>"} => does not work since jsondata is an object | |||
mw. | --e = p.expandEmbeddedTemplates({frame=frame, jsondata={["self"]=e,["."]=e}, jsonschema=p.defaultArgPath(jsonschema, {"properties", k, "items"}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays}) | ||
e = | |||
v[i] = e | |||
if (eval_template.type == "mustache" or eval_template.type == "mustache-wikitext") then | |||
if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end | |||
-- {{.}} in the template will be the value of e | |||
e = lustache:render(eval_template.value, e, p.tableMerge({self=eval_template.value}, eval_template.partials)) -- render with self as registered partial for recursion | |||
end | |||
if (eval_template.type == "mustache-wikitext") then --or eval_template.type == "wikitext") then | |||
if (debug) then msg = msg .. "Parse wikitext template " .. e .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end | |||
e = frame:preprocess( e ) | |||
end | |||
v[i] = e -- update array | |||
end | end | ||
if (stringify_arrays) then string_list = string_list .. e .. ";" end | if (stringify_arrays) then string_list = string_list .. e .. ";" end | ||
Line 258: | Line 287: | ||
--jsonschema = p.defaultArg(jsonschema, {}) | --jsonschema = p.defaultArg(jsonschema, {}) | ||
--jsondata = p.defaultArg(jsondata, {}) | --jsondata = p.defaultArg(jsondata, {}) | ||
if (categories == nil) then categories = jsondata[p.keys.category] end | --if (categories == nil) then categories = jsondata[p.keys.category] end -- let function param overwrite json property | ||
if (not p.nilOrEmpty(jsondata[p.keys.category])) then categories = jsondata[p.keys.category] end -- let json property overwrite function param | |||
local schema_res = p.walkJsonSchema({jsonschema=jsonschema, categories=categories, mode=mode, recursive=recursive, debug=debug}) | local schema_res = p.walkJsonSchema({jsonschema=jsonschema, categories=categories, mode=mode, recursive=recursive, debug=debug}) | ||
local expand_res = p.expandJsonRef({json=schema_res.jsonschema, debug=debug}) | |||
--mw. | jsonschema = expand_res.json | ||
--mw.log(mw.text.jsonEncode(jsonschema)) | |||
local display_label = p.defaultArgPath(jsondata, {p.keys.name}, "") | local display_label = p.defaultArgPath(jsondata, {p.keys.name}, "") | ||
Line 279: | Line 310: | ||
local smw_res = nil | local smw_res = nil | ||
if (mode == p.mode.header) then | if (mode == p.mode.header) then | ||
-- get the semantic properties by looking up the json keys in the json-ld context | |||
smw_res = p.getSemanticProperties({jsonschema=jsonschema, jsondata=json_res_store.res, store=false, debug=debug}) | smw_res = p.getSemanticProperties({jsonschema=jsonschema, jsondata=json_res_store.res, store=false, debug=debug}) | ||
-- store metadata where properties were defined / overridden | |||
for i, category in ipairs(schema_res.visited) do | |||
for k, v in pairs(schema_res.jsonschemas[category]['properties']) do | |||
if smw_res.definitions[k] == nil then smw_res.definitions[k] = {} end | |||
if smw_res.definitions[k]['defined_in'] == nil then smw_res.definitions[k]['defined_in'] = {} end | |||
table.insert(smw_res.definitions[k]['defined_in'], category) | |||
end | |||
end | |||
-- embed json-ld in resulting html for search engine discovery | |||
jsonld["@context"] = smw_res.context | jsonld["@context"] = smw_res.context | ||
jsonld["@type"] = p.tableMerge(p.tablefy(jsonschema.schema_type), p.tablefy(jsonld["@type"])) -- | jsonld["@type"] = p.tableMerge(p.tablefy(jsonschema.schema_type), p.tablefy(jsonld["@type"])) -- | ||
Line 302: | Line 346: | ||
for i, category in ipairs(schema_res.visited) do | for i, category in ipairs(schema_res.visited) do | ||
if (mode == p.mode.footer) then category = schema_res.visited[max_index - i +1] end --reverse order for footer templates | if (mode == p.mode.footer) then category = schema_res.visited[max_index - i +1] end --reverse order for footer templates | ||
local | local super_jsonschema = schema_res.jsonschemas[category] | ||
local template = schema_res.templates[category] | local template = schema_res.templates[category] | ||
if (template ~= nil) then | if (template ~= nil) then | ||
Line 311: | Line 355: | ||
end | end | ||
local child = frame:newChild{args=stripped_jsondata} | local child = frame:newChild{args=stripped_jsondata} | ||
if ( template:sub(1, #"=") == "=" ) then template = "\n" .. template end -- add line break if template starts with heading (otherwise not rendered by mw parser) | |||
wikitext = wikitext .. child:preprocess( template ) | wikitext = wikitext .. child:preprocess( template ) | ||
elseif (mode == p.mode.header) then | elseif (mode == p.mode.header) then | ||
local infobox_res = p.renderInfoBox({jsonschema=jsonschema, jsondata=jsondata}) | local ignore_properties = {[p.keys.category]=true} -- don't render type/category on every subclass | ||
for j, subcategory in ipairs(schema_res.visited) do | |||
if j > i then | |||
local subjsonschema = schema_res.jsonschemas[subcategory] | |||
for k, v in pairs(subjsonschema['properties']) do | |||
-- skip properties that are overwritten in subschemas, render them only once at the most specific position | |||
ignore_properties[k] = true | |||
end | |||
end | |||
end | |||
-- render the infobox for the schema itself and every super_schema, always using the global json-ld context (merged within walkJsonSchema()) | |||
-- context needs to be preprocessed with buildContext() since the generic json/table merge of the @context attribute produces a list of strings (remote context) and context objects | |||
-- context is already built in p.getSemanticProperties. schema_allOfMerged is used to provide the full schema for overridden properties | |||
local infobox_res = p.renderInfoBox({jsonschema=super_jsonschema, schema_allOfMerged=jsonschema, context=smw_res.context, property_definitions=smw_res.definitions, jsondata=jsondata, ignore_properties=ignore_properties}) | |||
wikitext = wikitext .. frame:preprocess( infobox_res.wikitext ) | wikitext = wikitext .. frame:preprocess( infobox_res.wikitext ) | ||
end | end | ||
Line 320: | Line 378: | ||
--local display_label = "" | --local display_label = "" | ||
--if (jsondata[p.keys.label] ~= nil) then display_label = p.splitString(jsondata[p.keys.label], '@')[1] end | --if (jsondata[p.keys.label] ~= nil) then display_label = p.splitString(jsondata[p.keys.label], '@')[1] end | ||
local set_categories_in_wikitext = {} | |||
p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.subcategory]) --classes/categories, nil for items | |||
if (title.nsText ~= "Category") then --items | |||
p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.category]) -- categories from schema type | |||
end | |||
-- Todo: Consider moving the category and this block to p.getSemanticProperties with store=true. However, setting categories with @category is only possible for subobjects | |||
if (smw_res ~= nil) then | if (smw_res ~= nil) then | ||
if (debug) then msg = msg .. "Store page properties" end | if (debug) then msg = msg .. "Store page properties" end | ||
-- category handling | |||
p.tableMerge(set_categories_in_wikitext, smw_res.properties[p.keys.category_pseudoproperty]) | |||
smw_res.properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property | |||
smw_res.properties['HasOswId'] = mw.title.getCurrentTitle().fullText --set special property OswId to own title | |||
-- label and display title handling | |||
smw_res.properties['Display title of'] = display_label --set special property display title | smw_res.properties['Display title of'] = display_label --set special property display title | ||
smw_res.properties['Display title of lowercase'] = display_label:lower() --store lowercase for case insensitive query | |||
smw_res.properties['Display title of normalized'] = display_label:lower():gsub('[^%w]+','') --store with all non-alphanumeric chars removed for normalized query | |||
p.setNormalizedLabel(smw_res.properties) --build normalized multilang label | |||
mw.ext.displaytitle.set(display_label) | mw.ext.displaytitle.set(display_label) | ||
--smw_res.properties['@category'] = jsondata[p.keys.category] | --smw_res.properties['@category'] = jsondata[p.keys.category] | ||
Line 338: | Line 410: | ||
--wikitext = mw.dumpObject(smw_res.properties) .. wikitext | --wikitext = mw.dumpObject(smw_res.properties) .. wikitext | ||
end | end | ||
wikitext = wikitext .. "\n" .. p.setCategories({categories=set_categories_in_wikitext, sortkey=display_label}).wikitext | |||
if (debug) then mw.logObject(res) end | if (debug) then mw.logObject(res) end | ||
Line 347: | Line 420: | ||
-- test: mw.logObject(p.renderInfoBox({jsonschema=p.loadJson({title="JsonSchema:Entity"}).json, jsondata={uuid="123123"}})) | -- test: mw.logObject(p.renderInfoBox({jsonschema=p.loadJson({title="JsonSchema:Entity"}).json, jsondata={uuid="123123"}})) | ||
function p.renderInfoBox(args) | function p.renderInfoBox(args) | ||
local debug = p.defaultArg(args.debug, false) | |||
local jsondata = p.defaultArg(args.jsondata, {}) | local jsondata = p.defaultArg(args.jsondata, {}) | ||
local schema = p.defaultArg(args.jsonschema, nil) | local schema = p.defaultArg(args.jsonschema, nil) -- local schema from the perspective of the current category | ||
local | local schema_allOfMerged = p.defaultArg(args.schema_allOfMerged, schema) -- global schema with allOfs merged | ||
local | local property_definitions = p.defaultArg(args.property_definitions, {}) -- dict schema_key: {property: <smw_property>, ...} | ||
local res = "" | local res = "" | ||
if schema == nil then return res end | if schema == nil then return res end | ||
local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context) | |||
local ignore_properties = p.defaultArg(args.ignore_properties, {}) | |||
local schema_label = "" | local schema_label = "" | ||
if schema['title'] ~= nil then schema_label = schema['title'] end | if schema['title'] ~= nil then schema_label = schema['title'] end | ||
Line 361: | Line 439: | ||
:attr( 'class', 'info_box' ) | :attr( 'class', 'info_box' ) | ||
:tag( 'tr' ) | :tag( 'tr' ) | ||
:tag( ' | :tag( 'th' ) | ||
:attr( 'class', ' | :attr( 'class', 'heading' ) | ||
:attr( 'colspan', '2' ) | :attr( 'colspan', '2' ) | ||
:wikitext( schema_label ) | :wikitext( schema_label ) | ||
Line 368: | Line 446: | ||
if (not ignore_properties[k]) then | if (not ignore_properties[k]) then | ||
if (schema['properties'] ~= nil and schema['properties'][k] ~= nil and (type(v) ~= 'table' or v[1] ~= nil)) then --literal or literal array | if (schema['properties'] ~= nil and schema['properties'][k] ~= nil and (type(v) ~= 'table' or v[1] ~= nil)) then --literal or literal array | ||
local def = | local def = schema_allOfMerged['properties'][k] | ||
--mw.logObject(def) | --mw.logObject(def) | ||
local label = k | local label = k | ||
if def['title'] ~= nil then label = def['title'] end | if def['title'] ~= nil then label = def['title'] end | ||
if def['title*'] ~= nil then -- multilang label with switch | |||
label = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. label | |||
for k,v in pairs(def['title*']) do label = label .. " |" .. k .. "=" .. v end | |||
label = label .. " }}" | |||
end | |||
local description = "" | |||
if def['description'] ~= nil then description = def['description'] end | |||
if def['description*'] ~= nil then -- multilang label with switch | |||
description = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. description | |||
for k,v in pairs(def['description*']) do description = description .. " |" .. k .. "=" .. v end | |||
description = description .. " }}" | |||
end | |||
if (p.tableLength(p.defaultArgPath(property_definitions, {k, 'defined_in'}, {})) > 0) then description = description .. "<br>Definition: " end | |||
for i, c in pairs(p.defaultArgPath(property_definitions, {k, 'defined_in'}, {})) do | |||
if (i > 1) then description = description .. ", " end | |||
description = description .. "[[:" ..c .. "]]" | |||
end | |||
if (description ~= "") then description = "{{#info: " .. description .. "|note }}" end -- smw tooltip | |||
label = label .. description | |||
--res = res .. title ": " .. v | --res = res .. title ": " .. v | ||
local cell = tbl:tag( 'tr' ) | local cell = tbl:tag( 'tr' ) | ||
Line 382: | Line 482: | ||
if (type(e) ~= 'table') then | if (type(e) ~= 'table') then | ||
local p_type = p.defaultArgPath(context, {k, '@type'}, '@value') | local p_type = p.defaultArgPath(context, {k, '@type'}, '@value') | ||
if (p_type == '@id') then e = "[[" .. string. | if (p_type == '@id' and p.defaultArgPath(def, {'items', 'type'}, 'unknown') == 'string' and def['eval_template'] == nil) then | ||
-- auto-link (OSW-)IDs if no eval_template is present | |||
e = string.gsub(e, "Category:", ":Category:") -- make sure category links work | |||
e = string.gsub(e, "File:", ":File:") -- do not embedd images but link to them | |||
e = "[[" .. e .. "]]" | |||
elseif (p_type == 'xsd:date') then -- formate date with user preferences | |||
e = "{{#dateformat:" .. e .. "|ymd}}" | |||
elseif (p_type == 'xsd:dateTime') then -- formate time with user preferences | |||
local smw_property = p.defaultArgPath(property_definitions, {k, 'property'}) | |||
if (smw_property ~= nil) then e = "{{#ask: [[{{FULLPAGENAME}}]]|?" .. smw_property .. "#LOCL#TO= |format=plain |mainlabel=-}}" | |||
else | |||
local _, _, date, hours, minutes = string.find(e, "(%S+)[T ](%S+)[:](%S+)[:?]") | |||
e = "{{#dateformat:" .. date .. "|ymd}} " .. hours .. ":" .. minutes .. " (UTC)" | |||
end | |||
elseif (type(v) == 'boolean') then | |||
if (v) then v = "✅" else v = "❌" end -- green check mark or red cross | |||
elseif ((string.len(e) > 100) and (string.find(e, "{{") == nil) and (string.find(e, "</") == nil)) then | |||
e = string.sub(e, 1, 100) .. "..."; -- limit infobox plain text to max 100 chars | |||
elseif (debug) then | |||
mw.log("Unformated: " .. k .. " " .. p.defaultArgPath(def, {'items', 'type'}, 'unknown')) | |||
mw.logObject(def) | |||
end | |||
cell:wikitext("\n* " .. e .. "") | cell:wikitext("\n* " .. e .. "") | ||
end | end | ||
Line 388: | Line 509: | ||
else | else | ||
local p_type = p.defaultArgPath(context, {k, '@type'}, '@value') | local p_type = p.defaultArgPath(context, {k, '@type'}, '@value') | ||
if (p_type == '@id') then v = "[[" .. string. | if (p_type == '@id' and p.defaultArgPath(def, {'type'}, 'unknown') == 'string' and def['eval_template'] == nil) then | ||
cell:wikitext( v ) | -- auto-link (OSW-)IDs if no eval_template is present | ||
v = string.gsub(v, "Category:", ":Category:") -- make sure category links work | |||
v = string.gsub(v, "File:", ":File:") -- do not embedd images but link to them | |||
v = "[[" .. v .. "]]" | |||
elseif (p_type == 'xsd:date') then -- formate date & time with user preferences | |||
v = "{{#dateformat:" .. v .. "|ymd}}" | |||
elseif (p_type == 'xsd:dateTime') then -- formate time with user preferences | |||
local smw_property = p.defaultArgPath(property_definitions, {k, 'property'}) | |||
if (smw_property ~= nil) then v = "{{#ask: [[{{FULLPAGENAME}}]]|?" .. smw_property .. "#LOCL#TO= |format=plain |mainlabel=-}}" | |||
else | |||
local _, _, date, hours, minutes = string.find(v, "(%S+)[T ](%S+)[:](%S+)[:?]") | |||
v = "{{#dateformat:" .. date .. "|ymd}} " .. hours .. ":" .. minutes .. " (UTC)" | |||
end | |||
elseif (type(v) == 'boolean') then | |||
if (v) then v = "✅" else v = "❌" end -- green check mark or red cross | |||
elseif ((string.len(v) > 100) and (string.find(v, "{{") == nil) and (string.find(v, "</") == nil)) then | |||
v = string.sub(v, 1, 100) .. "..."; -- limit infobox plain text to max 100 chars | |||
elseif (debug) then | |||
mw.log("Unformated: " .. k .. " " .. p.defaultArgPath(def, {'type'}, 'unknown')) | |||
mw.logObject(def) | |||
end | |||
cell:wikitext("\n" .. v .. "") | |||
end | end | ||
end | end | ||
Line 453: | Line 595: | ||
jsonschema = p.expandJsonRef({json=p.loadJson({title=category, slot="jsonschema"}).json}).json | jsonschema = p.expandJsonRef({json=p.loadJson({title=category, slot="jsonschema"}).json}).json | ||
mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true})) | mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true})) | ||
mw.log(mw.text.jsonEncode(p.buildContext({jsonschema=jsonschema, debug=false}).context)) | |||
or | or | ||
jsonschema = { | jsonschema = { | ||
Line 475: | Line 618: | ||
--]] | --]] | ||
-- constructs a property specific local jsonld context | |||
function p.buildContext(args) | function p.buildContext(args) | ||
local schema = p.defaultArg(args.jsonschema, {}) | local schema = p.defaultArg(args.jsonschema, {}) | ||
Line 486: | Line 630: | ||
elseif (type(v) == 'table' and v[1] ~= nil) then --custom addtional mappings, e. g. "type*": ["Property:HasType"] | elseif (type(v) == 'table' and v[1] ~= nil) then --custom addtional mappings, e. g. "type*": ["Property:HasType"] | ||
result[k] = v | result[k] = v | ||
elseif (type(v) == 'table' and v['@id'] == nil) then --subcontext | elseif (type(v) == 'table' and v['@id'] == nil and v['@reverse'] == nil) then --subcontext | ||
p.tableMerge(result, p.buildContext({context=v}).context) | p.tableMerge(result, p.buildContext({context=v}).context) | ||
else | else | ||
Line 495: | Line 639: | ||
local properties = p.defaultArg(schema.properties, {}) | local properties = p.defaultArg(schema.properties, {}) | ||
-- build property context | |||
for k,v in pairs(properties) do | for k,v in pairs(properties) do | ||
local subcontext = nil | local subcontext = nil | ||
Line 501: | Line 646: | ||
subcontext = p.buildContext({jsonschema=properties[k]}).context | subcontext = p.buildContext({jsonschema=properties[k]}).context | ||
elseif (p.defaultArgPath(properties, {k, 'items', 'type'}) == 'object') then | elseif (p.defaultArgPath(properties, {k, 'items', 'type'}) == 'object') then | ||
mw.logObject(properties[k]['items']) | --mw.logObject(properties[k]['items']) | ||
subcontext = p.buildContext({jsonschema=properties[k]['items']}).context | subcontext = p.buildContext({jsonschema=properties[k]['items']}).context | ||
end | end | ||
Line 515: | Line 660: | ||
--maps jsondata values to semantic properties by using the @context attribute within the schema | --maps jsondata values to semantic properties by using the @context attribute within the schema | ||
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | --test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:schema:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | ||
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={"some uri",{test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | --test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={"some uri",{test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true})) | ||
--[[ | --[[ | ||
Line 540: | Line 685: | ||
local schema = p.defaultArg(args.jsonschema, {}) | local schema = p.defaultArg(args.jsonschema, {}) | ||
local subschema = p.defaultArg(args.subschema, schema) | local subschema = p.defaultArg(args.subschema, schema) | ||
local parent_schema_property = p.defaultArg(args.parent_schema_property, {}) | local parent_schema_property = p.defaultArg(args.parent_schema_property, {}) -- ToDo: Not used except in getSemanticQuery => remove | ||
local store = p.defaultArg(args.store, false) | local store = p.defaultArg(args.store, false) | ||
local root = p.defaultArg(args.root, true) | local root = p.defaultArg(args.root, true) | ||
local properties = p.defaultArg(args.properties, {}) --semantic properties to store, dict key=property_name, value=array of string values | |||
local debug = p.defaultArg(args.debug, false) | local debug = p.defaultArg(args.debug, false) | ||
--if (debug) then mw.logObject("Call getSemanticProperties with args " .. mw.dumpObject( args ) .. "\n<br>") end | --if (debug) then mw.logObject("Call getSemanticProperties with args " .. mw.dumpObject( args ) .. "\n<br>") end | ||
local | local subjectId = mw.title.getCurrentTitle().fullText | ||
local subobjectId = nil | |||
if (root == false and jsondata['uuid'] ~= nil) then | |||
subobjectId = "OSW" .. string.gsub(jsondata['uuid'], "-", "") | |||
subjectId = subjectId .. '#' .. subobjectId | |||
end | |||
local property_data = {} | local property_data = {} | ||
local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context) | local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context) | ||
Line 562: | Line 714: | ||
for k,v in pairs(jsondata) do | for k,v in pairs(jsondata) do | ||
local property_names = {} | local property_names = {} | ||
local subobject_properties = {} -- reverse properties to store in the subobject | |||
local mapping_found = false | local mapping_found = false | ||
local property_definitions = {} | local property_definitions = {} -- list of objects {id=..., reverse=...} | ||
for term, def in pairs(context) do | for term, def in pairs(context) do | ||
local term_parts = p.splitString(term, "*") | local term_parts = p.splitString(term, "*") | ||
if ( | if (term_parts[1] == k) then --custom additional mapping term*(*...): "Property:..." | ||
if type(def) == 'table' then table.insert(property_definitions, def["@id"]) | if type(def) == 'table' then | ||
else table.insert(property_definitions, def) end | -- note: json-ld allows only @id OR @reverse | ||
if (def["@id"] ~= nil) then table.insert(property_definitions, {id=def["@id"], reverse=false}) end | |||
if (def["@reverse"] ~= nil) then table.insert(property_definitions, {id=def["@reverse"], reverse=true}) end | |||
else table.insert(property_definitions, {id=def}) end | |||
end | end | ||
end | end | ||
if (debug) then mw.logObject(property_definitions) end | if (debug) then mw.logObject(property_definitions) end | ||
for i,e in ipairs(property_definitions) do | for i,e in ipairs(property_definitions) do | ||
local property_definition = p.splitString( | local id = e["id"] | ||
local property_definition = p.splitString(id, ':') | |||
if property_definition[1] == p.keys.property_ns_prefix then | if property_definition[1] == p.keys.property_ns_prefix then | ||
mapping_found = true | mapping_found = true | ||
table.insert(property_names, | property_name = string.gsub(id, p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url | ||
if (e["reverse"]) then -- reverse properties are handled in the respective subobject | |||
if (subobject_properties[property_name] == nil) then subobject_properties[property_name] = {} end --initialize empty list | |||
table.insert(subobject_properties[property_name], subjectId) -- add triple subobject -property-> subject | |||
else table.insert(property_names, property_name) end | |||
local schema_property = p.defaultArg(schema_properties[k], {}) | local schema_property = p.defaultArg(schema_properties[k], {}) | ||
local schema_type = p.defaultArg(schema_property.type, nil) --todo: also load smw property type on demand | local schema_type = p.defaultArg(schema_property.type, nil) --todo: also load smw property type on demand | ||
property_data[k] = {schema_type=schema_type, schema_data=schema_property, property= | property_data[k] = {schema_type=schema_type, schema_data=schema_property, property=property_name, value=v, reverse=e["reverse"]} | ||
end | end | ||
end | end | ||
Line 596: | Line 754: | ||
local values = {} | local values = {} | ||
if (v[1] == nil) then --key value array = object/dict | if (v[1] == nil) then --key value array = object/dict | ||
local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=v, store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]}) | local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=v, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]}) | ||
local id = subproperties_res.id --subobject_id | local id = subproperties_res.id --subobject_id | ||
if (id ~= nil) then | if (id ~= nil) then | ||
Line 606: | Line 764: | ||
for i, e in pairs(v) do | for i, e in pairs(v) do | ||
if (type(e) == 'table') then | if (type(e) == 'table') then | ||
local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=e, store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]}) | local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=e, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]}) | ||
local id = subproperties_res.id --subobject_id | local id = subproperties_res.id --subobject_id | ||
if (id ~= nil) then | if (id ~= nil) then | ||
Line 635: | Line 793: | ||
end | end | ||
local store_res = nil | local store_res = nil | ||
if (store) then | if (store) then | ||
properties['HasOswId'] = subjectId | |||
if (root) then | if (root) then | ||
if (debug) then mw.logObject("Store page properties") end | if (debug) then mw.logObject("Store page properties") end | ||
store_res = mw.smw.set( properties ) --store as semantic properties | store_res = mw.smw.set( properties ) --store as semantic properties | ||
else | else | ||
properties['@category'] = {} | |||
p.tableMerge(properties['@category'], jsondata[p.keys.category]) -- from json property 'type' | |||
properties['@category'] | p.tableMerge(properties['@category'], properties[p.keys.category_pseudoproperty]) -- from json-ld context 'Property:Category' | ||
properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property | |||
if (jsondata[p.keys.name] ~= nil) then properties['Display title of'] = jsondata[p.keys.name] | if (jsondata[p.keys.name] ~= nil) then properties['Display title of'] = jsondata[p.keys.name] | ||
elseif (jsondata[p.keys.label] ~= nil and jsondata[p.keys.label][1] ~= nil) then properties['Display title of'] = p.splitString(jsondata[p.keys.label][1], '@')[1] | elseif (jsondata[p.keys.label] ~= nil and jsondata[p.keys.label][1] ~= nil) then properties['Display title of'] = p.splitString(jsondata[p.keys.label][1], '@')[1] | ||
else properties['Display title of'] = p.defaultArg(subschema['title'], "") end | |||
p.setNormalizedLabel(properties) --build normalized multilang label | |||
if (p.tableLength(properties) > 0) then | if (p.tableLength(properties) > 0) then | ||
store_res = mw.smw.subobject( properties, subobjectId ) --store as subobject | store_res = mw.smw.subobject( properties, subobjectId ) --store as subobject | ||
Line 674: | Line 830: | ||
if (statement["HasSubject"] == nil or statement["HasSubject"][1] == nil or statement["HasSubject"][1] == "") then --implicit subject | if (statement["HasSubject"] == nil or statement["HasSubject"][1] == nil or statement["HasSubject"][1] == "") then --implicit subject | ||
if (statement["HasProperty"] ~= nil and statement["HasProperty"][1] ~= nil and statement["HasProperty"][1] ~= "" and statement["HasObject"] ~= nil) then | if (statement["HasProperty"] ~= nil and statement["HasProperty"][1] ~= nil and statement["HasProperty"][1] ~= "" and statement["HasObject"] ~= nil) then | ||
local property = | local property = string.gsub(statement["HasProperty"][1], p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url | ||
if (debug) then | if (debug) then | ||
mw.log("Set property " .. property .. " from statement to ") | mw.log("Set property " .. property .. " from statement to ") | ||
Line 767: | Line 923: | ||
if type(v) == "table" then | if type(v) == "table" then | ||
json[k] = p.expandJsonRef({json=v}).json | json[k] = p.expandJsonRef({json=v}).json | ||
end | |||
end | |||
local result = p.copy(json) | |||
for k,v in pairs(json) do | |||
if (k == "allOf") then | |||
if (type(v) == "table" and v[1] == nil) then v = {v} end -- ensure array | |||
for i,s in pairs(v) do | |||
result = p.tableMerge(s, result) | |||
if (debug) then mw.log("merge allOf with title " .. s["title"]) end | |||
end | |||
result[k] = nil | |||
end | end | ||
end | end | ||
return {json= | return {json=result} | ||
end | end | ||
function p.defaultArg(arg, default) | function p.defaultArg(arg, default) | ||
Line 850: | Line 1,019: | ||
--test: mw.logObject(p.tableMerge({"string", test1="test1", subtable1={"test"}}, {"string2", test1="test2", test3="test4"})) | --test: mw.logObject(p.tableMerge({"string", test1="test1", subtable1={"test"}}, {"string2", test1="test2", test3="test4"})) | ||
function p.tableMerge(t1, t2) | function p.tableMerge(t1, t2) | ||
if (t1 == nil) then t1 = {} elseif (type(t1) ~= 'table') then t1 = {t1} end | |||
if (t2 == nil) then t2 = {} elseif (type(t2) ~= 'table') then t2 = {t2} end | |||
for k,v in pairs(t2) do | for k,v in pairs(t2) do | ||
if type(v) == "table" then | if type(v) == "table" then | ||
Line 875: | Line 1,046: | ||
for k, v in pairs(obj) do res[p.copy(k, s)] = p.copy(v, s) end | for k, v in pairs(obj) do res[p.copy(k, s)] = p.copy(v, s) end | ||
return res | return res | ||
end | |||
-- build normalized multilang label | |||
function p.setNormalizedLabel(properties, use_fallbacks) | |||
if (use_fallbacks == nil) then use_fallbacks = true end | |||
if (properties['HasLabel'] ~= nil) then | |||
labels = properties['HasLabel'] | |||
if(type(labels) ~= 'table') then labels = {labels} end | |||
properties['HasNormalizedLabel'] = {} | |||
for i, label in ipairs(labels) do | |||
label_norm = p.splitString(label, '@')[1]:lower():gsub('[^%w]+','') | |||
label_lang = "en" | |||
if (p.splitString(label, '@')[2] ~= nil) then label_lang = p.splitString(label, '@')[2] end | |||
table.insert(properties['HasNormalizedLabel'], label_norm .. "@" .. label_lang) | |||
end | |||
elseif (use_fallbacks and properties['HasName'] ~= nil) then -- fallback, assume English lang | |||
labels = properties['HasName'] | |||
if(type(labels) ~= 'table') then labels = {labels} end | |||
properties['HasNormalizedLabel'] = {} | |||
for i, label in ipairs(labels) do | |||
label_norm = label:lower():gsub('[^%w]+','') | |||
table.insert(properties['HasNormalizedLabel'], label_norm .. "@en") | |||
end | |||
elseif (use_fallbacks and properties['Display title of'] ~= nil) then -- fallback, assume English lang | |||
labels = properties['Display title of'] | |||
if(type(labels) ~= 'table') then labels = {labels} end | |||
properties['HasNormalizedLabel'] = {} | |||
for i, label in ipairs(labels) do | |||
label_norm = label:lower():gsub('[^%w]+','') | |||
table.insert(properties['HasNormalizedLabel'], label_norm .. "@en") | |||
end | |||
end | |||
end | end | ||
return p | return p |
Revision as of 07:03, 13 November 2024
Documentation for this module may be created at Module:MwJson/doc
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSW7d7193567ea14e4e89b74de88983b718", slot="jsondata"}).json, debug=true, mode="header"}))
local lustache = require("Module:Lustache")
-- Module table; "p" stands for package. Everything exported hangs off this table.
local p = {}

-- Names of the jsonschema / json-ld keys looked up in schemas and json data.
p.keys = {
    category                = 'type',
    category_pseudoproperty = 'Category', -- Property:Category
    subcategory             = 'subclass_of',
    schema_type             = 'schema_type',
    property_ns_prefix      = 'Property',
    schema                  = 'osl_schema',
    template                = 'eval_template',
    mode                    = 'mode',
    context                 = '@context',
    allOf                   = 'allOf',
    label                   = 'label',
    name                    = 'name',
    description             = 'description',
    text                    = 'text',
    debug                   = '_debug',
}

-- Names of the page slots this module reads.
p.slots = {
    main            = 'main',
    jsondata        = 'jsondata',
    jsonschema      = 'jsonschema',
    header_template = 'header_template',
    footer_template = 'footer_template',
    data_template   = 'data_template',
}

-- Processing modes accepted by the `mode` argument of the functions below.
p.mode = {
    header = 'header',
    footer = 'footer',
    query  = 'query',
}

-- Decoded json kept between calls, indexed as p.cache[<page title>][<slot name>].
p.cache = {}
--loads json from a wiki page
--test: mw.logObject(p.loadJson({title="JsonSchema:Entity"}))
--test: mw.logObject(p.loadJson({title="Category:Entity", slot="jsonschema"}))
-- Loads and decodes the json stored in a slot of a wiki page.
-- Results are kept in p.cache[<title>][<slot>], so each page/slot pair is fetched at most once.
-- args.title: full page title including namespace (default "JsonSchema:Entity", for testing)
-- args.slot:  slot name (default 'main')
-- args.debug: if truthy, debug messages are collected
-- returns {json=<decoded table, {} if no content was found>, debug_msg=<string>}
function p.loadJson(args)
    local page_title = p.defaultArg(args.title, "JsonSchema:Entity") --for testing
    local slot = p.defaultArg(args.slot, 'main')
    local debug = p.defaultArg(args.debug, nil)
    local msg = ""
    local json = {}

    local page_cache = p.cache[page_title]
    if (page_cache == nil) then
        page_cache = {}
        p.cache[page_title] = page_cache
    elseif (page_cache[slot] ~= nil) then
        -- report the slot that was actually requested, not always 'jsondata'
        if (debug) then msg = msg .. "Fetch slot " .. tostring(slot) .. " of page " .. page_title .. " from cache <br>" end
        return {json=page_cache[slot], debug_msg=msg}
    end

    local text = nil
    if (slot == 'main') then
        --json = mw.loadJsonData( "JsonSchema:Entity" ) --requires MediaWiki 1.39
        -- Let MediaWiki parse the full title: splitting at ':' and using only the first two parts
        -- truncates titles that contain further colons (e. g. "Property:schema:url")
        -- and fails for titles without a namespace prefix.
        local page = mw.title.new(page_title)
        if (page ~= nil) then text = page:getContent() end -- nil for an invalid title
    else
        if (debug) then msg = msg .. "Fetch slot " .. tostring(slot) .. " of page " .. page_title .. "<br>" end
        text = mw.slots.slotContent( slot , page_title )
    end
    if (text ~= nil) then json = mw.text.jsonDecode(text) end
    --mw.logObject(json)

    page_cache[slot] = json
    return {json=json, debug_msg=msg}
end
-- test: mw.logObject(p.walkJsonSchema({jsonschema=p.loadJson({title="Category:Hardware", slot="jsonschema"}).json, debug=true}).jsonschema)
-- Walks the category (super schema) hierarchy of a jsonschema and collects schemas and templates.
-- args.jsonschema:  schema to start from (default {})
-- args.jsonschemas: accumulator, dict <category> => decoded schema (default {})
-- args.categories:  category or list of categories to visit; derived from the schema's allOf if nil
-- args.visited:     accumulator, list of categories already stored (super categories first)
-- args.mode:        p.mode.header / p.mode.footer select which template slot is fetched
-- args.templates:   accumulator, dict <category> => template slot content
-- args.recursive:   also walk the super categories of every visited category (default true)
-- args.root:        true for the outermost call; only then all visited schemas are merged into the result
-- args.debug:       collect debug messages; they are prepended to the returned wikitext
-- returns {jsonschema=, jsonschemas=, templates=, visited=, wikitext=}
function p.walkJsonSchema(args)
    local jsonschema = p.defaultArg(args.jsonschema, {})
    local jsonschemas = p.defaultArg(args.jsonschemas, {})
    local categories = p.defaultArg(args.categories, nil)
    local visited = p.defaultArg(args.visited, {})
    local mode = p.defaultArg(args.mode, p.mode.header)
    --local merged_jsonschema = p.defaultArg(args.merged_jsonschema, {})
    local templates = p.defaultArg(args.templates, {})
    local recursive = p.defaultArg(args.recursive, true)
    local root = p.defaultArg(args.root, true)
    local debug = p.defaultArg(args.debug, false)
    local msg = ""
    local wikitext = ""

    local category_template_slot = nil -- stays nil for modes without a template slot (e. g. query)
    if (mode == p.mode.footer) then category_template_slot = p.slots.footer_template end
    if (mode == p.mode.header) then category_template_slot = p.slots.header_template end

    if (categories == nil) then categories = p.getCategories({jsonschema=jsonschema, includeNamespace=true}).categories end
    if (type(categories) ~= 'table') then categories = {categories} end
    if (debug) then msg = msg .. "Supercategories: " .. mw.dumpObject(categories) .. "\n<br>" end

    for _, category in pairs(categories) do
        if (not p.tableContains(visited, category)) then
            --mw.logObject("Visit " .. category)
            if (debug) then msg = msg .. "Fetch slot " .. p.slots.jsonschema .. " from page " .. category .. "\n<br>" end
            local super_jsonschema_str = mw.slots.slotContent( p.slots.jsonschema , category )
            if (super_jsonschema_str ~= nil) then
                -- keep this local: as a global it would leak between recursion levels and invocations
                local super_jsonschema = mw.text.jsonDecode( super_jsonschema_str )
                if (recursive) then
                    -- forward debug so the messages of nested levels are not lost
                    local res = p.walkJsonSchema({jsonschema=super_jsonschema, jsonschemas=jsonschemas, templates=templates, mode=mode, visited=visited, root=false, debug=debug})
                    wikitext = wikitext .. res.wikitext
                end
                --mw.logObject("Store " .. category)
                -- register after the recursion so that super categories precede their subcategories
                table.insert(visited, category)
                jsonschemas[category] = mw.text.jsonDecode( super_jsonschema_str ) --keep a copy of the schema, super_jsonschema passed by references gets modified
                --jsonschema = p.tableMerge(jsonschema, super_jsonschema) --merge superschema is done by the caller
            end
            -- tostring(): the slot is nil for modes other than header/footer
            if (debug) then msg = msg .. "Fetch slot " .. tostring(category_template_slot) .. " from page " .. category .. "\n<br>" end
            templates[category] = mw.slots.slotContent( category_template_slot , category )
        end
    end

    if (root) then
        for _, category in ipairs(visited) do
            --merge all schemas. we need to make a copy here, otherwise jsonschemas["Category:Entity"] contains the merged schema
            jsonschema = p.copy(p.tableMerge(jsonschema, jsonschemas[category]))
        end
    end

    if (debug) then wikitext = msg .. wikitext end
    return {jsonschema=jsonschema, jsonschemas=jsonschemas, templates=templates, visited=visited, wikitext=wikitext}
end
--[[ test:
category = "Category:Hardware"
page = "Item:OSW7d7193567ea14e4e89b74de88983b718"
category2 = "Category:OSW80e240a2e17d4ae5adfe6419051aa0bb"
page2 = "Item:OSWa4da6664aeac466a86b09e6b32a1cb41"
mw.logObject(p.expandEmbeddedTemplates({
jsonschema=p.walkJsonSchema({jsonschema=p.loadJson({title=category, slot="jsonschema"}).json, debug=true}).jsonschema,
jsondata=p.loadJson({title=page, slot="jsondata"}).json,
debug=true, mode="render"
}).res)
--]]
-- Selects the template definition that applies to `mode`.
-- candidates: a single template definition or a list of them
-- A definition applies if it declares no mode or exactly `mode`; the last applicable one visited wins.
-- label: name used in the debug text for skipped definitions
-- returns <selected definition or nil>, <debug text>
local function selectTemplateForMode(candidates, mode, debug, label)
    local selected = nil
    local msg = ""
    if (candidates[1] == nil) then candidates = {candidates} end --ensure list of objects
    for _, t in pairs(candidates) do
        local t_mode = t[p.keys.mode]
        if (t_mode == nil or t_mode == mode) then
            selected = t --use only render templates in render mode and store templates in store mode; no mode = default
        elseif (debug) then
            msg = msg .. "Ignore " .. label .. mw.dumpObject( t ) .. "\n<br>"
        end
    end
    return selected, msg
end

-- Expands the templates (eval_template) embedded in a jsonschema for the given jsondata.
-- Values are replaced in place within args.jsondata.
-- args.frame:            frame used for preprocessing (default: current frame)
-- args.jsondata:         data to process (default {})
-- args.jsonschema:       schema describing jsondata (default {})
-- args.template:         template definition for the object itself; looked up in jsondata / jsonschema if nil
-- args.mode:             only template definitions without mode or with this mode are applied
-- args.stringify_arrays: replace list values with a ';'-terminated string of their items (default false)
-- args.debug:            collect debug messages (default false)
-- returns {res=<processed jsondata, or the rendered text if a wikitext template was applied>, debug_msg=<string>}
function p.expandEmbeddedTemplates(args)
    local frame = p.defaultArg(args.frame, mw.getCurrentFrame())
    local jsondata = p.defaultArg(args.jsondata, {})
    local jsonschema = p.defaultArg(args.jsonschema, {})
    local template = p.defaultArg(args.template, nil)
    local mode = p.defaultArg(args.mode, nil)
    local stringify_arrays = p.defaultArg(args.stringify_arrays, false)
    -- Must be declared here: an undeclared `debug` resolves to the global debug library table,
    -- which is truthy, so debug output was built on every call regardless of the argument.
    local debug = p.defaultArg(args.debug, false)
    local msg = ""
    local res = p.defaultArg(args.jsondata, "")

    for k,v in pairs(jsondata) do
        local eval_template, skipped = selectTemplateForMode(p.defaultArgPath(jsonschema, {"properties", k, p.keys.template}, {}), mode, debug, "eval_template")
        msg = msg .. skipped

        if (eval_template ~= nil and eval_template.value ~= nil and (eval_template.type == "mustache" or eval_template.type == "mustache-wikitext")) then
            -- mustache can handle objects and arrays so we can parse it directly
            -- todo: handle nested templates
            local template_param = {[k]=v}
            if (eval_template.root_key == false) then template_param = v end
            if (debug) then msg = msg .. "Parse mustache template " .. eval_template.value .. " with params " .. mw.dumpObject( template_param ) .. "\n<br>" end
            jsondata[k] = lustache:render(eval_template.value, template_param, p.tableMerge({self=eval_template.value}, eval_template.partials)) -- render with self as registered partial for recursion
            if (eval_template.type == "mustache-wikitext") then
                jsondata[k] = frame:preprocess( jsondata[k] )
            end
        elseif type(v) == 'table' then
            if (v[1] == nil) then --key value array = object/dict
                local sub_res = p.expandEmbeddedTemplates({frame=frame, jsondata=v, jsonschema=p.defaultArgPath(jsonschema, {"properties", k}, {}), template=eval_template, mode=mode, stringify_arrays=stringify_arrays, debug=debug})
                msg = msg .. sub_res.debug_msg
                jsondata[k] = sub_res.res
                --if (sub_res.unparsed ~= nil) then jsondata[k] = sub_res.unparsed else jsondata[k] = sub_res.wikitext end
            else --list array
                -- schema and template of the items depend on k only, so look them up once per list
                local item_schema = p.defaultArgPath(jsonschema, {"properties", k, "items"}, {})
                local item_template, item_skipped = selectTemplateForMode(p.defaultArgPath(jsonschema, {"properties", k, "items", p.keys.template}, {}), mode, debug, "eval_template")
                msg = msg .. item_skipped
                local string_list = ""
                for i,e in pairs(v) do
                    if type(e) == 'table' then
                        local sub_res = p.expandEmbeddedTemplates({frame=frame, jsondata=e, jsonschema=item_schema, template=item_template, mode=mode, stringify_arrays=stringify_arrays, debug=debug})
                        msg = msg .. sub_res.debug_msg
                        if (type(sub_res.res) == 'table') then
                            if (debug) then msg = msg .. "Values for " .. k .. " contains non-literal items: " .. mw.dumpObject( sub_res.res ) .. " => skip value in wikitemplate array param creation\n<br>" end
                        else
                            if (stringify_arrays) then string_list = string_list .. sub_res.res .. ";"
                            else v[i] = sub_res.res end
                        end
                    else
                        if (item_template ~= nil and item_template.value ~= nil) then
                            --evaluate single array item string as json {"self": "<value>", ".": "<value>"} => does not work since jsondata is an object
                            if (item_template.type == "mustache" or item_template.type == "mustache-wikitext") then
                                if (debug) then msg = msg .. "Parse mustache template " .. item_template.value .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end
                                -- {{.}} in the template will be the value of e
                                e = lustache:render(item_template.value, e, p.tableMerge({self=item_template.value}, item_template.partials)) -- render with self as registered partial for recursion
                            end
                            if (item_template.type == "mustache-wikitext") then --or item_template.type == "wikitext") then
                                if (debug) then msg = msg .. "Parse wikitext template " .. e .. " with params " .. mw.dumpObject( e ) .. "\n<br>" end
                                e = frame:preprocess( e )
                            end
                            v[i] = e -- update array
                        end
                        -- tostring(): boolean items cannot be concatenated directly
                        if (stringify_arrays) then string_list = string_list .. tostring(e) .. ";" end
                    end
                end
                if (stringify_arrays) then jsondata[k] = string_list end
            end
        end
    end

    if (template == nil) then
        local templates = jsondata[p.keys.template]
        if (templates == nil) then templates = p.defaultArg(jsonschema[p.keys.template], {}) end
        local skipped
        template, skipped = selectTemplateForMode(templates, mode, debug, "template")
        msg = msg .. skipped
    end

    if (template ~= nil and template.type == "wikitext") then
        for k,v in pairs(jsondata) do
            if type(v) == 'table' then --not supported as wiki template parameter
                if (debug) then msg = msg .. "Values for " .. k .. " contains non-literals: " .. mw.dumpObject( v ) .. " => skip wikitemplate parsing\n<br>" end
                return {res=res, debug_msg=msg}
            end
        end
        if (template.value ~= nil) then
            if (debug) then msg = msg .. "Parse wikitemplate " .. template.value .. " with params " .. mw.dumpObject( jsondata ) .. "\n<br>" end
            local child = frame:newChild{args=jsondata}
            res = child:preprocess( template.value )
        elseif (template.page ~= nil) then
            if (debug) then msg = msg .. "Parse wikitemplate " .. template.page .. " with params " .. mw.dumpObject( jsondata ) .. "\n<br>" end
            res = frame:expandTemplate{ title = template.page, args = jsondata }
        end
    end
    --if (debug) then mw.logObject(msg) end
    return {res=res, debug_msg=msg}
end
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSW7d7193567ea14e4e89b74de88983b718", slot="jsondata"}).json, debug=true, mode="header"}))
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Item:OSWa4da6664aeac466a86b09e6b32a1cb41", slot="jsondata"}).json, debug=true, mode="header"}))
-- mw.logObject(p.processJsondata({jsondata=p.loadJson({title="Category:OSWb3022bbf7e7146eb8e6f6e3264f50bbe", slot="jsondata"}).json, debug=true, mode="header", categories={"Category:Category"}}))
-- Processes the jsondata of a page: resolves its schema hierarchy, stores semantic properties
-- (header mode only) and renders the category templates or default infoboxes.
-- args.frame:      frame used for preprocessing (default: current frame)
-- args.jsondata:   decoded json data of the page (default {})
-- args.jsonschema: optional schema to start from (default {})
-- args.categories: categories to use if jsondata does not name any itself
-- args.recursive:  walk the category hierarchy recursively (default true)
-- args.mode:       p.mode.header (default) or p.mode.footer
-- args.debug:      collect debug messages (default false)
-- args.template is accepted by callers but currently not used.
-- returns {wikitext=<string>, debug_msg=<string>}
function p.processJsondata(args)
    local frame = p.defaultArg(args.frame, mw.getCurrentFrame())
    local jsondata = p.defaultArg(args.jsondata, {})
    local jsonschema = p.defaultArg(args.jsonschema, {})
    local categories = p.defaultArg(args.categories, nil)
    local recursive = p.defaultArg(args.recursive, true)
    local mode = p.defaultArg(args.mode, p.mode.header)
    local debug = p.defaultArg(args.debug, false)
    local title = mw.title.getCurrentTitle()
    local wikitext = ""
    local msg = "" --debug msg

    if (p.nilOrEmpty(jsondata) or (p.nilOrEmpty(categories) and p.nilOrEmpty(jsonschema) and p.nilOrEmpty(jsondata[p.keys.category]))) then return {wikitext=wikitext, debug_msg=msg} end --nothing to do here

    if (not p.nilOrEmpty(jsondata[p.keys.category])) then categories = jsondata[p.keys.category] end -- let json property overwrite function param

    local schema_res = p.walkJsonSchema({jsonschema=jsonschema, categories=categories, mode=mode, recursive=recursive, debug=debug})
    local expand_res = p.expandJsonRef({json=schema_res.jsonschema, debug=debug})
    jsonschema = expand_res.json
    --mw.log(mw.text.jsonEncode(jsonschema))

    local display_label = p.defaultArgPath(jsondata, {p.keys.name}, "")
    if (display_label == "" or (title.nsText ~= "Category" and title.nsText ~= "Property")) then
        display_label = p.defaultArgPath(jsondata, {p.keys.label, 1, p.keys.text}, "") --prefer label for all non-category and non-property pages
    end

    -- independent copies, since the template expansion replaces values in place
    local jsonld = p.copy(jsondata)
    local json_data_store = p.copy(jsondata)
    local json_data_render = p.copy(jsondata)

    -- local: as a global this result would leak into later invocations
    local json_res_store = p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=json_data_store, mode='store', debug=debug})
    msg = msg .. json_res_store.debug_msg
    --mw.log("JSONDATA STORE")
    --mw.logObject(json_res_store.res)

    local smw_res = nil
    if (mode == p.mode.header) then
        -- get the semantic properties by looking up the json keys in the json-ld context
        smw_res = p.getSemanticProperties({jsonschema=jsonschema, jsondata=json_res_store.res, store=false, debug=debug})

        -- store metadata where properties were defined / overridden
        for _, category in ipairs(schema_res.visited) do
            -- a schema is not required to declare properties
            for k, _ in pairs(schema_res.jsonschemas[category]['properties'] or {}) do
                if smw_res.definitions[k] == nil then smw_res.definitions[k] = {} end
                if smw_res.definitions[k]['defined_in'] == nil then smw_res.definitions[k]['defined_in'] = {} end
                table.insert(smw_res.definitions[k]['defined_in'], category)
            end
        end

        -- embed json-ld in resulting html for search engine discovery
        jsonld["@context"] = smw_res.context
        jsonld["@type"] = p.tableMerge(p.tablefy(jsonschema.schema_type), p.tablefy(jsonld["@type"]))
        jsonld['schema:name'] = p.defaultArgPath(jsonld, {p.keys.label, 1, p.keys.text}, jsonld['name']) --google does not support @value and @lang
        jsonld['schema:description'] = p.defaultArgPath(jsonld, {p.keys.description, 1, p.keys.text}, nil)
        for k, v in pairs(jsonld) do
            if (type(v) == "string") then
                local vpart = p.splitString(v, ':')
                if (p.tableLength(vpart) == 2 and vpart[1] == "File") then jsonld[k] = mw.getCurrentFrame():callParserFunction( 'filepath', { vpart[2] } ) end --google does not follow redirects via "File":"wiki:Special:Redirect/file/"
            end
        end
        -- the attribute is delimited by single quotes, so replace them within the payload
        local jsonld_attr = mw.text.jsonEncode( jsonld ):gsub("'","`")
        wikitext = wikitext .. "<div class='jsonld-header' style='display:none' data-jsonld='" .. jsonld_attr .. "'></div>"
    end

    local json_res = p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=json_data_render, mode='render', debug=debug})
    msg = msg .. json_res.debug_msg
    jsondata = json_res.res
    --mw.log("JSONDATA RENDER")
    --mw.logObject(jsondata)

    local max_index = p.tableLength(schema_res.visited)
    for i, category in ipairs(schema_res.visited) do
        if (mode == p.mode.footer) then category = schema_res.visited[max_index - i +1] end --reverse order for footer templates
        local super_jsonschema = schema_res.jsonschemas[category]
        local category_template = schema_res.templates[category]

        if (category_template ~= nil) then
            if (debug) then msg = msg .. "Parse \n\n" .. category_template .. " \n\nwith params " .. mw.dumpObject( jsondata ) .. "\n<br>" end
            local stripped_jsondata={}
            for k, v in pairs(jsondata) do
                if (type(v) ~= 'table') then stripped_jsondata[k] = v end --delete object values, not supported by wiki templates
            end
            local child = frame:newChild{args=stripped_jsondata}
            if ( category_template:sub(1, #"=") == "=" ) then category_template = "\n" .. category_template end -- add line break if template starts with heading (otherwise not rendered by mw parser)
            wikitext = wikitext .. child:preprocess( category_template )
        elseif (mode == p.mode.header) then
            local ignore_properties = {[p.keys.category]=true} -- don't render type/category on every subclass
            for j, subcategory in ipairs(schema_res.visited) do
                if j > i then
                    local subjsonschema = schema_res.jsonschemas[subcategory]
                    for k, _ in pairs(subjsonschema['properties'] or {}) do
                        -- skip properties that are overwritten in subschemas, render them only once at the most specific position
                        ignore_properties[k] = true
                    end
                end
            end
            -- render the infobox for the schema itself and every super_schema using always the global json-ld context (merged within walkJsonSchema())
            -- context needs to be preprocessed with buildContext() since the generic json/table merge of the @context attribute produces a list of strings (remote context) and context objects
            -- context is already built in p.getSemanticProperties. schema_allOfMerged is used to provide the full schema for overridden properties
            local infobox_res = p.renderInfoBox({jsonschema=super_jsonschema, schema_allOfMerged=jsonschema, context=smw_res.context, property_definitions=smw_res.definitions, jsondata=jsondata, ignore_properties=ignore_properties})
            wikitext = wikitext .. frame:preprocess( infobox_res.wikitext )
        end
    end

    local set_categories_in_wikitext = {}
    p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.subcategory]) --classes/categories, nil for items
    if (title.nsText ~= "Category") then --items
        p.tableMerge(set_categories_in_wikitext, json_res_store.res[p.keys.category]) -- categories from schema type
    end

    -- Todo: Consider moving the category and this block to p.getSemanticProperties with store=true. However, settings categories with @category is only possible for subobjects
    if (smw_res ~= nil) then
        if (debug) then msg = msg .. "Store page properties" end
        -- category handling
        p.tableMerge(set_categories_in_wikitext, smw_res.properties[p.keys.category_pseudoproperty])
        smw_res.properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property
        smw_res.properties['HasOswId'] = title.fullText --set special property OswId to own title

        -- label and display title handling
        smw_res.properties['Display title of'] = display_label --set special property display title
        smw_res.properties['Display title of lowercase'] = display_label:lower() --store lowercase for case insensitive query
        smw_res.properties['Display title of normalized'] = (display_label:lower():gsub('[^%w]+','')) --store with all non-alphanumeric chars removed for normalized query
        p.setNormalizedLabel(smw_res.properties) --build normalized multilang label
        mw.ext.displaytitle.set(display_label)
        --smw_res.properties['@category'] = jsondata[p.keys.category]

        local store_res = mw.smw.set( smw_res.properties ) --store as semantic properties
        if (debug) then msg = msg .. mw.dumpObject(smw_res.properties) end
        -- mw.smw.set returns true on success and a table carrying an `error` field otherwise;
        -- that table is truthy, so a plain truthiness test can never reach the error branch
        if (store_res == true) then
            if (debug) then msg = msg .. "SMW SUCCESS: " end
        else
            local store_error = "unknown error"
            if (type(store_res) == 'table' and store_res.error ~= nil) then store_error = tostring(store_res.error) end
            wikitext = wikitext .. store_error
            if (debug) then msg = msg .. "SMW ERROR: " .. store_error end
        end
        --wikitext = mw.dumpObject(smw_res.properties) .. wikitext
    end

    wikitext = wikitext .. "\n" .. p.setCategories({categories=set_categories_in_wikitext, sortkey=display_label}).wikitext

    local result = {wikitext=wikitext, debug_msg=msg}
    if (debug) then mw.logObject(result) end
    return result
end
-- renders a default infobox
-- test: mw.logObject(p.renderInfoBox({jsonschema=p.loadJson({title="JsonSchema:Entity"}).json, jsondata={uuid="123123"}}))
-- Formats a single literal value as wikitext for an infobox cell.
-- value:                the literal (string, number or boolean)
-- key:                  schema key of the property, used to look up context and property definitions
-- def:                  schema definition of the property
-- value_type:           json schema type declared for the value ('unknown' if not declared)
-- context:              json-ld context, dict <key> => {['@type']=...}
-- property_definitions: dict <key> => {property=<smw property>, ...}
-- returns the formatted value
local function formatInfoBoxValue(value, key, def, value_type, context, property_definitions, debug)
    local p_type = p.defaultArgPath(context, {key, '@type'}, '@value')
    if (p_type == '@id' and value_type == 'string' and def['eval_template'] == nil) then
        -- auto-link (OSW-)IDs if no eval_template is present
        value = string.gsub(value, "Category:", ":Category:") -- make sure category links work
        value = string.gsub(value, "File:", ":File:") -- do not embed images but link to them
        value = "[[" .. value .. "]]"
    elseif (p_type == 'xsd:date') then -- format date with user preferences
        value = "{{#dateformat:" .. value .. "|ymd}}"
    elseif (p_type == 'xsd:dateTime') then -- format time with user preferences
        local smw_property = p.defaultArgPath(property_definitions, {key, 'property'})
        if (smw_property ~= nil) then
            value = "{{#ask: [[{{FULLPAGENAME}}]]|?" .. smw_property .. "#LOCL#TO= |format=plain |mainlabel=-}}"
        else
            local _, _, date, hours, minutes = string.find(value, "(%S+)[T ](%S+)[:](%S+)[:?]")
            -- leave values that do not match the pattern untouched instead of concatenating nil
            if (date ~= nil) then value = "{{#dateformat:" .. date .. "|ymd}} " .. hours .. ":" .. minutes .. " (UTC)" end
        end
    elseif (type(value) == 'boolean') then
        if (value) then value = "✅" else value = "❌" end -- green check mark or red cross
    elseif ((string.len(value) > 100) and (string.find(value, "{{") == nil) and (string.find(value, "</") == nil)) then
        value = string.sub(value, 1, 100) .. "..." -- limit infobox plain text to max 100 chars
    elseif (debug) then
        mw.log("Unformated: " .. key .. " " .. value_type)
        mw.logObject(def)
    end
    return value
end

-- renders a default infobox
-- args.jsonschema:           local schema from the perspective of the current category; nothing is rendered without it
-- args.schema_allOfMerged:   global schema with allOfs merged (default: args.jsonschema)
-- args.property_definitions: dict schema_key: {property: <smw_property>, ...}
-- args.context:              json-ld context (default: built from args.jsonschema)
-- args.jsondata:             data to display (default {})
-- args.ignore_properties:    dict <key> => true for keys that must not be rendered
-- args.debug:                log values that received no special formatting
-- returns {wikitext=<html table as string, "" without schema>}
function p.renderInfoBox(args)
    local debug = p.defaultArg(args.debug, false)
    local jsondata = p.defaultArg(args.jsondata, {})
    local schema = p.defaultArg(args.jsonschema, nil) -- local schema from the perspective of the current category
    local schema_allOfMerged = p.defaultArg(args.schema_allOfMerged, schema) -- global schema with allOfs merged
    local property_definitions = p.defaultArg(args.property_definitions, {}) -- dict schema_key: {property: <smw_property>, ...}
    local res = ""
    -- return the same shape as the regular path: callers read the `wikitext` field
    if schema == nil then return {wikitext=res} end
    local context = p.defaultArg(args.context, p.buildContext({jsonschema=schema}).context)
    local ignore_properties = p.defaultArg(args.ignore_properties, {})

    local schema_label = ""
    if schema['title'] ~= nil then schema_label = schema['title'] end

    -- see also: https://help.fandom.com/wiki/Extension:Scribunto/HTML_Library_usage_notes
    local tbl = mw.html.create( 'table' )
    tbl
        :attr( 'class', 'info_box' )
        :tag( 'tr' )
            :tag( 'th' )
                :attr( 'class', 'heading' )
                :attr( 'colspan', '2' )
                :wikitext( schema_label )

    local merged_properties = schema_allOfMerged['properties'] or {}
    for k,v in pairs(jsondata) do
        local is_literal = (type(v) ~= 'table' or v[1] ~= nil) --literal or literal array
        if (not ignore_properties[k] and schema['properties'] ~= nil and schema['properties'][k] ~= nil and is_literal) then
            -- prefer the merged definition, fall back to the local one if the merged schema lacks the key
            local def = merged_properties[k] or schema['properties'][k]
            --mw.logObject(def)

            local label = k
            if def['title'] ~= nil then label = def['title'] end
            if def['title*'] ~= nil then -- multilang label with switch
                label = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. label
                for lang, text in pairs(def['title*']) do label = label .. " |" .. lang .. "=" .. text end
                label = label .. " }}"
            end

            local description = ""
            if def['description'] ~= nil then description = def['description'] end
            if def['description*'] ~= nil then -- multilang description with switch
                description = "{{#switch:{{USERLANGUAGECODE}} |#default=" .. description
                for lang, text in pairs(def['description*']) do description = description .. " |" .. lang .. "=" .. text end
                description = description .. " }}"
            end
            local defined_in = p.defaultArgPath(property_definitions, {k, 'defined_in'}, {})
            if (p.tableLength(defined_in) > 0) then description = description .. "<br>Definition: " end
            for i, c in pairs(defined_in) do
                if (i > 1) then description = description .. ", " end
                description = description .. "[[:" ..c .. "]]"
            end
            if (description ~= "") then description = "{{#info: " .. description .. "|note }}" end -- smw tooltip
            label = label .. description

            local cell = tbl:tag( 'tr' )
                :tag( 'th' )
                    :wikitext( label )
                    :done()
                :tag( 'td' )

            if (type(v) == 'table') then
                local item_type = p.defaultArgPath(def, {'items', 'type'}, 'unknown')
                for _, e in pairs(v) do
                    if (type(e) ~= 'table') then
                        -- format the item itself (the former inline code inspected the enclosing list for booleans)
                        e = formatInfoBoxValue(e, k, def, item_type, context, property_definitions, debug)
                        cell:wikitext("\n* " .. e .. "")
                    end
                end
            else
                local value_type = p.defaultArgPath(def, {'type'}, 'unknown')
                v = formatInfoBoxValue(v, k, def, value_type, context, property_definitions, debug)
                cell:wikitext("\n" .. v .. "")
            end
        end
    end

    res = res .. tostring( tbl )
    --mw.logObject(res)
    return {wikitext=res}
end
-- test
-- mw.logObject(p.getCategories({jsonschema={allOf={["$ref"]="/wiki/Category:Test?action=raw&slot=jsonschema"}}, includeNamespace=true}))
-- mw.logObject(p.getCategories({jsonschema={allOf={{["$ref"]="/wiki/Category:Test?action=raw&slot=jsonschema"}, {["$ref"]="/wiki/Category:Test2?action=raw&slot=jsonschema"}}}}))
-- Extracts the categories referenced by the "$ref" entries of a schema's allOf.
-- args.jsonschema:       schema to inspect (default {})
-- args.includeNamespace: prefix every result with "Category:" (default false)
-- returns {categories=<list of category names>}
function p.getCategories(args)
    local schema = p.defaultArg(args.jsonschema, {})
    local with_namespace = p.defaultArg(args.includeNamespace, false)
    local found = {}

    -- appends every category named in a reference, e.g. "/wiki/Category:Test?action=raw"
    local function collect(ref)
        for name in ref:gmatch("Category:([^?]+)") do
            if (with_namespace) then name = "Category:" .. name end
            table.insert(found, name)
        end
    end

    local all_of = schema[p.keys.allOf]
    if (all_of == nil) then return {categories=found} end

    for key, entry in pairs(all_of) do
        if type(entry) == 'table' then
            -- "allOf": [{"$ref": "/wiki/Category:Test?action=raw"}]
            local ref = entry['$ref']
            if (ref ~= nil) then collect(ref) end
        elseif (key == '$ref') then
            -- "allOf": {"$ref": "/wiki/Category:Test?action=raw"}
            collect(entry)
        end
    end
    return {categories=found}
end
--sets a list of categories on the page
--test: mw.logObject(p.setCategories({categories={"Cat1", "Category:Cat2"}}))
-- Builds the wikitext that assigns the page to the given categories.
-- args.categories: category name or list of names, with or without "Category:" prefix (default {})
-- args.sortkey:    optional sort key appended to every category link (default "")
-- returns {wikitext=<concatenated category links>}
function p.setCategories(args)
    local categories = p.defaultArg(args.categories, {})
    local sortkey = p.defaultArg(args.sortkey, "")

    -- everything that follows the category name within a link
    local link_tail = "]]"
    if (sortkey ~= "") then link_tail = "|" .. sortkey .. "]]" end

    if (type(categories) ~= 'table') then categories = {categories} end

    local links = {}
    for _, entry in pairs(categories) do
        local name = string.gsub(entry, "Category:", "") -- first result only; the match count is dropped
        links[#links + 1] = "[[Category:" .. name .. link_tail
    end
    return {wikitext=table.concat(links)}
end
--[[ test
category = "Category:Entity"
jsonschema = p.expandJsonRef({json=p.loadJson({title=category, slot="jsonschema"}).json}).json
mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true}))
mw.log(mw.text.jsonEncode(p.buildContext({jsonschema=jsonschema, debug=false}).context))
or
jsonschema = {
["@context"]={test="level 0"},
properties={
test={
type="object",
["@context"]={test1="level 1"},
properties= {
test= {
type="array",
items= {
type="object",
["@context"]={test2="level 2"}
}
}
}
}
}
}
mw.logObject(p.buildContext({jsonschema=jsonschema, debug=true}))
--]]
-- Constructs a property specific local json-ld context from a json schema.
-- args.jsonschema: schema whose '@context' (key p.keys.context) and 'properties' are evaluated (default: {})
-- args.context:    context to process instead of the one found in the schema
-- args.result:     table the collected term definitions are written into (default: new table)
-- returns {context=...}
-- Term definitions are copied into the result by reference. Nested context tables (tables without
-- a first array element, '@id' or '@reverse') are flattened into the result. For properties of
-- type 'object' (or arrays with items of type 'object') the context of the nested schema is stored
-- under the '@context' key of the corresponding term definition.
function p.buildContext(args)
    local schema = p.defaultArg(args.jsonschema, {})
    --mw.logObject(schema)
    local context = p.defaultArg(args.context, schema[p.keys.context])
    local result = p.defaultArg(args.result, {})

    if context ~= nil then
        for term, def in pairs(context) do
            local def_is_table = type(def) == 'table'
            if type(term) == 'number' and type(def) == 'string' then
                --table.insert(result, def) --skip context imports
            elseif def_is_table and def[1] == nil and def['@id'] == nil and def['@reverse'] == nil then
                -- subcontext: flatten its terms into the result
                p.tableMerge(result, p.buildContext({context=def}).context)
            else
                -- plain mapping, term definition with @id / @reverse, or
                -- custom additional mappings, e. g. "type*": ["Property:HasType"]
                result[term] = def
            end
        end
    end

    -- build property context
    local properties = p.defaultArg(schema.properties, {})
    for name, _ in pairs(properties) do
        -- pick the schema that describes the nested object(s), if there is one
        local nested_schema = nil
        if p.defaultArgPath(properties, {name, 'type'}) == 'object' then
            --mw.logObject(properties[name])
            nested_schema = properties[name]
        elseif p.defaultArgPath(properties, {name, 'items', 'type'}) == 'object' then
            --mw.logObject(properties[name]['items'])
            nested_schema = properties[name]['items']
        end

        if nested_schema ~= nil then
            local subcontext = p.buildContext({jsonschema=nested_schema}).context
            if p.tableLength(subcontext) > 0 then
                local entry = result[name]
                if entry == nil then
                    entry = {}
                elseif type(entry) == 'string' then
                    entry = {["@id"]=entry} -- promote the short form to an expanded term definition
                end
                result[name] = entry
                if entry[p.keys.context] == nil then entry[p.keys.context] = {} end
                entry[p.keys.context] = p.tableMerge(entry[p.keys.context], subcontext)
            end
        end
    end
    return {context=result}
end
--maps jsondata values to semantic properties by using the @context attribute within the schema
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:schema:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true}))
--test: mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={"some uri",{test="Property:TestProperty", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}}, jsondata={test="TestValue", myObjectProperty="123"}, debug=true}))
--[[
mw.logObject(p.getSemanticProperties({jsonschema={["@context"]={test="Property:TestProperty", subobject="Property:HasSubobject", myObjectProperty={["@id"]= "Property:MyObjectProperty", ["@type"]= "@id"}}}, jsondata={
test="TestValue", myObjectProperty="123", subobject={uuid="123-123-123", test="TestValue2"}
}, debug=true}))
mw.logObject(p.getSemanticProperties({jsonschema=p.loadJson({title="Category:OSW80e240a2e17d4ae5adfe6419051aa0bb", slot="jsonschema"}).json, jsondata=p.loadJson({title="Item:OSWa4da6664aeac466a86b09e6b32a1cb41", slot="jsondata"}).json, debug=true}))
category = "Category:Hardware"
page = "Item:OSW7d7193567ea14e4e89b74de88983b718"
category2 = "Category:OSW80e240a2e17d4ae5adfe6419051aa0bb"
page2 = "Item:OSWa4da6664aeac466a86b09e6b32a1cb41"
jsonschema =p.walkJsonSchema({jsonschema=p.loadJson({title=category, slot="jsonschema"}).json, debug=true}).jsonschema
mw.logObject(p.getSemanticProperties({
jsonschema=jsonschema,
jsondata=p.expandEmbeddedTemplates({jsonschema=jsonschema, jsondata=p.loadJson({title=page, slot="jsondata"}).json}).res,
debug=true
}).properties)
--]]
-- Maps jsondata values to semantic properties by using the json-ld context of the schema.
-- args.jsondata:   the data (dict) to map (default: {})
-- args.jsonschema: the schema the context is built from (default: {})
-- args.subschema:  schema describing the current nesting level of jsondata (default: args.jsonschema)
-- args.parent_schema_property: passed on recursive calls, currently not evaluated here
-- args.store:      if true, the collected properties are written with mw.smw.set (root)
--                  or mw.smw.subobject (nested objects) (default: false)
-- args.root:       true for the page level call, false for nested objects (default: true)
-- args.properties: dict property_name -> list of values to extend (default: {})
-- args.context:    prebuilt context; if omitted it is built with p.buildContext
-- args.debug:      if true, intermediate results are logged (default: false)
-- returns {properties=..., definitions=..., id=<subobject id or nil>, context=..., error=<string>}
function p.getSemanticProperties(args)
    local jsondata = p.defaultArg(args.jsondata, {})
    local schema = p.defaultArg(args.jsonschema, {})
    local subschema = p.defaultArg(args.subschema, schema)
    local parent_schema_property = p.defaultArg(args.parent_schema_property, {}) -- ToDo: Not used except in getSemanticQuery => remove
    local store = p.defaultArg(args.store, false)
    local root = p.defaultArg(args.root, true)
    local properties = p.defaultArg(args.properties, {}) --semantic properties to store, dict key=property_name, value=array of string values
    local debug = p.defaultArg(args.debug, false)
    --if (debug) then mw.logObject("Call getSemanticProperties with args " .. mw.dumpObject( args ) .. "\n<br>") end

    local subjectId = mw.title.getCurrentTitle().fullText
    local subobjectId = nil
    if (root == false and jsondata['uuid'] ~= nil) then
        -- nested objects with a uuid get a stable subobject id derived from it
        subobjectId = "OSW" .. string.gsub(jsondata['uuid'], "-", "")
        subjectId = subjectId .. '#' .. subobjectId
    end

    local property_data = {}
    -- only build the context when the caller did not hand one in (recursive calls always do)
    local context = args.context
    if (context == nil) then context = p.buildContext({jsonschema=schema}).context end
    local error_msg = "" -- named error_msg to keep the builtin error() reachable
    if (debug) then mw.logObject(context) end

    if schema ~= nil and context ~= nil then
        local schema_properties = p.defaultArg(subschema.properties, {})
        if (debug and root) then
            for k,v in pairs(context) do
                if type(k) == 'number' then mw.logObject("imports " .. v)
                elseif type(v) == 'table' and v["@id"] ~= nil then mw.logObject("" .. k .. " maps to " .. v["@id"])
                else mw.logObject("" .. k .. " maps to " .. mw.dumpObject(v)) end
            end
        end

        for k,v in pairs(jsondata) do
            local property_names = {}
            local subobject_properties = {} -- reverse properties to store in the subobject
            local mapping_found = false
            local property_definitions = {} -- list of objects {id=..., reverse=...}

            -- collect all context terms that map this key (term or term*, term**, ...)
            for term, def in pairs(context) do
                local term_parts = p.splitString(term, "*")
                if (term_parts[1] == k) then --custom additional mapping term*(*...): "Property:..."
                    if type(def) == 'table' then
                        -- note: json-ld allows only @id OR @reverse
                        if (def["@id"] ~= nil) then table.insert(property_definitions, {id=def["@id"], reverse=false}) end
                        if (def["@reverse"] ~= nil) then table.insert(property_definitions, {id=def["@reverse"], reverse=true}) end
                    else table.insert(property_definitions, {id=def}) end
                end
            end
            if (debug) then mw.logObject(property_definitions) end

            for i,e in ipairs(property_definitions) do
                local id = e["id"]
                local property_definition = p.splitString(id, ':')
                if property_definition[1] == p.keys.property_ns_prefix then
                    mapping_found = true
                    -- local on purpose: this used to leak into the global environment
                    local property_name = string.gsub(id, p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url
                    if (e["reverse"]) then -- reverse properties are handled in the respective subobject
                        if (subobject_properties[property_name] == nil) then subobject_properties[property_name] = {} end --initialize empty list
                        table.insert(subobject_properties[property_name], subjectId) -- add triple subobject -property-> subject
                    else table.insert(property_names, property_name) end
                    local schema_property = p.defaultArg(schema_properties[k], {})
                    local schema_type = p.defaultArg(schema_property.type, nil) --todo: also load smw property type on demand
                    property_data[k] = {schema_type=schema_type, schema_data=schema_property, property=property_name, value=v, reverse=e["reverse"]}
                end
            end

            for i, property_name in ipairs(property_names) do
                if (properties[property_name] == nil) then properties[property_name] = {} end --initialize empty list
            end

            if type(v) == 'table' then
                --if (debug) then mw.logObject("prop " .. k .. " = " .. mw.dumpObject(v)) end
                if (mapping_found) then
                    local subcontext = p.copy(p.defaultArgPath(context, {k, p.keys.context}, {})) --deepcopy, see also https://phabricator.wikimedia.org/T269990
                    context = p.tableMerge(context, subcontext) -- pull up nested context
                    local values = {}
                    if (v[1] == nil) then --key value array = object/dict
                        local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=v, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]})
                        local id = subproperties_res.id --subobject_id
                        if (id ~= nil) then
                            id = mw.title.getCurrentTitle().fullText .. '#' .. id
                            table.insert(values, id)
                        end
                        properties = p.processStatement({subject=properties, statement=subproperties_res.properties, debug=debug}).subject
                    else --list array
                        for i, e in pairs(v) do
                            if (type(e) == 'table') then
                                local subproperties_res = p.getSemanticProperties({jsonschema=schema, jsondata=e, properties=p.copy(subobject_properties), store=true, root=false, debug=debug, context=context, subschema=schema_properties[k], parent_schema_property=property_data[k]})
                                local id = subproperties_res.id --subobject_id
                                if (id ~= nil) then
                                    id = mw.title.getCurrentTitle().fullText .. '#' .. id
                                    table.insert(values, id)
                                end
                                properties = p.processStatement({subject=properties, statement=subproperties_res.properties, debug=debug}).subject
                            else values = v end --plain strings
                        end
                    end
                    for pi, property_name in ipairs(property_names) do
                        for i,value in pairs(values) do table.insert(properties[property_name], value) end
                        if (debug) then mw.logObject("set " .. property_name .. " = " .. mw.dumpObject(values)) end
                    end
                else
                    if (debug) then mw.logObject("not mapped: " .. k .. " = " .. mw.dumpObject(v)) end
                end
            else
                if (mapping_found) then
                    for pi, property_name in ipairs(property_names) do
                        table.insert(properties[property_name], v)
                        if (debug) then mw.logObject("set " .. property_name .. " = " .. mw.dumpObject(v)) end
                    end
                else
                    if (debug) then mw.logObject("not mapped: " .. k .. " = " .. mw.dumpObject(v)) end
                end
            end
        end
    end

    local store_res = nil
    if (store) then
        properties['HasOswId'] = subjectId
        if (root) then
            if (debug) then mw.logObject("Store page properties") end
            store_res = mw.smw.set( properties ) --store as semantic properties
        else
            properties['@category'] = {}
            p.tableMerge(properties['@category'], jsondata[p.keys.category]) -- from json property 'type'
            p.tableMerge(properties['@category'], properties[p.keys.category_pseudoproperty]) -- from json-ld context 'Property:Category'
            properties[p.keys.category_pseudoproperty] = nil -- delete pseudo property
            if (jsondata[p.keys.name] ~= nil) then properties['Display title of'] = jsondata[p.keys.name]
            elseif (jsondata[p.keys.label] ~= nil and jsondata[p.keys.label][1] ~= nil) then properties['Display title of'] = p.splitString(jsondata[p.keys.label][1], '@')[1]
            else properties['Display title of'] = p.defaultArg(subschema['title'], "") end
            p.setNormalizedLabel(properties) --build normalized multilang label
            if (p.tableLength(properties) > 0) then
                store_res = mw.smw.subobject( properties, subobjectId ) --store as subobject
                if (debug) then mw.logObject("Store subobject with id " .. (subobjectId or "<random>")) end
            end
        end
    end
    if (debug) then mw.logObject(properties) end

    -- According to the Semantic Scribunto documentation mw.smw.set / mw.smw.subobject return
    -- true on success and a table carrying an `error` message on failure. Both are truthy,
    -- so the failure case has to be detected by type instead of by `not store_res`.
    if (type(store_res) == 'table' and store_res.error ~= nil) then
        error_msg = error_msg .. tostring(store_res.error)
    end
    if (debug) then mw.logObject(error_msg) end
    return {properties=properties, definitions=property_data, id=subobjectId, context=context, error=error_msg}
end
-- Applies a statement with an implicit subject to a property dict.
-- args.statement: dict of property lists; evaluated keys are "HasSubject", "HasProperty" and "HasObject"
-- args.subject:   dict property_name -> list of values that receives the statement's objects
-- args.debug:     if true, the applied property and objects are logged (default: false)
-- returns {subject=...} (the same table that was passed in, extended in place)
-- A statement is only applied if its first "HasSubject" entry is missing or empty and its first
-- "HasProperty" entry is a non-empty string. The property namespace prefix is stripped from it.
function p.processStatement(args)
    local statement = p.defaultArg(args.statement)
    local subject = p.defaultArg(args.subject)
    local debug = p.defaultArg(args.debug, false)

    -- handle "approved" statements: skip everything that names an explicit subject
    local explicit = statement["HasSubject"]
    if (explicit ~= nil and explicit[1] ~= nil and explicit[1] ~= "") then
        return {subject=subject}
    end

    local predicate = statement["HasProperty"]
    local objects = statement["HasObject"]
    if (predicate == nil or predicate[1] == nil or predicate[1] == "" or objects == nil) then
        return {subject=subject}
    end

    local property = string.gsub(predicate[1], p.keys.property_ns_prefix .. ":", "") -- also allow prefix properties like: Property:schema:url
    if (debug) then
        mw.log("Set property " .. property .. " from statement to ")
        mw.logObject(objects)
    end
    if (subject[property] == nil) then subject[property] = {} end
    for _, object in pairs(objects) do
        table.insert(subject[property], object)
    end
    return {subject=subject}
end
-- build a semantic query based on provided properties and their schema definition
--[[ test:
mw.logObject(p.getSemanticQuery({
jsonschema={
["@context"]={
test="Property:TestProperty",
number_max="Property:HasNumber",
date_min="Property:HasDate"
},
properties={
test={title="Test", type="string"},
number_max={title="Number", type="string", format="number", options={role={query={filter="max"}}}},
date_min={title="Date", type="string", format="date", options={role={query={filter="min"}}}},
}
},
jsondata={test="TestValue", number_max=5, date_min="01.01.2023"}
}))
--]]
-- Builds an #ask query from the property definitions returned by p.getSemanticProperties(args).
-- args: passed on unchanged to p.getSemanticProperties
-- returns {wikitext=...}; the wikitext is "" if no property definition was found
-- Per definition one condition [[<property>::<value>]] and one printout |?<property>(=<title>) is emitted.
-- The schema option options.role.query.filter (default 'eq') selects the comparator for
-- string properties with format 'number' or 'date'; other string properties are matched as substring.
function p.getSemanticQuery(args)
    --local jsondata = p.defaultArg(args.jsondata, {})
    --local schema = p.defaultArg(args.jsonschema, {})
    local conditions = ""
    local printouts = ""
    local semantic_properties = p.getSemanticProperties(args)
    --mw.logObject(semantic_properties)
    for _, def in pairs(semantic_properties.definitions) do
        -- see also: https://www.semantic-mediawiki.org/wiki/Help:Search_operators
        local schema_data = def.schema_data
        local filter = p.defaultArgPath(schema_data, {'options', 'role', 'query', 'filter'}, 'eq')
        local value = def.value
        if schema_data.type == 'string' then
            if schema_data.format == 'number' or schema_data.format == 'date' then
                -- NOTE(review): 'min' emits "<" and 'max' emits ">" - confirm that this direction is intended
                if (filter == 'min') then
                    value = "<" .. value
                elseif (filter == 'max') then
                    value = ">" .. value
                end -- any other filter: exact match
            else
                value = "~*" .. value .. "*"
            end
        end
        conditions = conditions .. "\n[[" .. def.property .. "::" .. value .. "]]"
        printouts = printouts .. "\n|?" .. def.property
        if (schema_data.title ~= nil) then printouts = printouts .. "=" .. schema_data.title end
    end

    local res = ""
    if (conditions ~= "") then res = "{{#ask:" .. conditions .. printouts .. "}}" end
    return {wikitext=res}
end
-- HELPERS
-- expands all $ref
-- args.json:  the json (dict) to expand; it is modified in place where it contains no top level $ref (default: {})
-- args.debug: if true, resolved references are logged (default: false)
-- returns {json=...}, a copy of the expanded json
-- A non-relative "$ref" (no '#') is loaded with p.loadJson and used as the base the remaining keys
-- are merged onto. Nested tables are expanded recursively. Finally all "allOf" entries are
-- merged with the expanded json and the "allOf" key is removed.
--test: mw.logObject(p.expandJsonRef({json={items={test="value", ["$ref"]="/wiki/JsonSchema:Label?action=raw"}}}).json)
--test: mw.logObject(p.expandJsonRef({json={["$ref"]="/wiki/Category:Item?action=raw&slot=jsonschema"}}).json)
--test: mw.logObject(p.expandJsonRef({json={["$ref"]="/wiki/JsonSchema:Statement?action=raw"}}).json)
function p.expandJsonRef(args)
    local json = p.defaultArg(args.json, {})
    local debug = p.defaultArg(args.debug, false)

    local ref = json["$ref"]
    if (ref ~= nil) then
        -- e. g. "/wiki/JsonSchema:Label?action=raw" or "/wiki/Category:Entity?action=raw&slot=jsonschema"
        if string.find(ref, "#") then
            if (debug) then mw.logObject("Skip relative reference") end
        else
            local uri = mw.uri.new(ref)
            local ref_title = mw.text.split(uri.path, "wiki/", true)[2]
            local ref_slot = uri.query["slot"]
            if (debug) then
                if (ref_slot ~= nil) then mw.logObject("Ref found with title " .. ref_title .. " and slot " .. ref_slot)
                else mw.logObject("Ref found with title " .. ref_title) end
            end
            local ref_json = p.loadJson({title=ref_title, slot=ref_slot}).json
            json["$ref"] = nil
            if (ref_json ~= nil) then
                -- p.tableMerge writes into its first argument. p.loadJson can hand out a table
                -- straight from p.cache, so merge into a copy to keep the cached document pristine.
                json = p.tableMerge(p.copy(ref_json), json)
            end
        end
    end

    -- expand nested objects / arrays
    for k,v in pairs(json) do
        if type(v) == "table" then
            json[k] = p.expandJsonRef({json=v}).json
        end
    end

    local result = p.copy(json)
    local all_of = json["allOf"]
    if (all_of ~= nil) then
        if (type(all_of) == "table" and all_of[1] == nil) then all_of = {all_of} end -- ensure array
        for i,s in pairs(all_of) do
            result = p.tableMerge(s, result)
            if (debug) then
                -- the title is optional, so it must not be concatenated unguarded
                local title = nil
                if (type(s) == "table") then title = s["title"] end
                mw.log("merge allOf with title " .. tostring(title))
            end
        end
        result["allOf"] = nil
    end
    return {json=result}
end
-- Returns arg, or default if arg is nil.
-- Only nil triggers the default: false, "" and 0 are returned unchanged.
function p.defaultArg(arg, default)
    if (arg ~= nil) then return arg end
    return default
end
-- returns the value of a table (dict) path or default, if the path is not defined
-- arg:     the table to look into; if nil, default is returned
-- path:    list of keys to follow, e. g. {"some", "defined", "path"}; if nil or empty, arg is returned
-- default: value returned as soon as a step of the path yields nil
-- The path table is only read, so callers may reuse it for further lookups.
-- test: mw.logObject(p.defaultArgPath({some={defined={path="value"}}}, {"some", "defined", "path"}, "default_value"))
-- test: mw.logObject(p.defaultArgPath({some={defined={path="value"}}}, {"some", "undefined", "path"}, "default_value"))
function p.defaultArgPath(arg, path, default)
    if (arg == nil) then return default end
    if (path == nil) then return arg end
    local value = arg
    for i = 1, #path do
        value = value[path[i]]
        if (value == nil) then return default end
    end
    return value
end
-- Splits inputstr at the separator character(s) and returns the non-empty parts as a list.
-- sep defaults to ";". It is placed unescaped into a pattern character class, so every
-- character of sep acts as a separator and empty parts are dropped.
function p.splitString(inputstr, sep)
    local separator = sep
    if separator == nil then separator = ";" end
    local pattern = "([^" .. separator .. "]+)"
    local parts = {}
    for piece in string.gmatch(inputstr, pattern) do
        parts[#parts + 1] = piece
    end
    return parts
end
-- Serializes a value to a string.
-- Kept as a thin wrapper: the work is delegated to mw.dumpObject().
function p.dump(value)
    return mw.dumpObject(value)
end
-- Converts a literal to a table.
-- Tables are returned unchanged, nil becomes an empty table and
-- any other value is wrapped into a single element list.
function p.tablefy(o)
    if (type(o) == 'table') then return o end
    if (o == nil) then return {} end
    return {o}
end
-- Returns true if val equals one of the elements of the array tab (flat arrays only).
-- The search uses ipairs, so it ends at the first nil element.
function p.tableContains(tab, val)
    local found = false
    for _, candidate in ipairs(tab) do
        if candidate == val then
            found = true
            break
        end
    end
    return found
end
-- Returns the number of entries of a table, counting array and dict entries alike.
function p.tableLength(t)
    local size = 0
    for _, _ in pairs(t) do
        size = size + 1
    end
    return size
end
-- Returns true if o is nil, an empty string or a table without entries; false for everything else.
function p.nilOrEmpty(o)
    local kind = type(o)
    if (kind == 'nil') then return true end
    if (kind == 'string') then return o == "" end
    if (kind == 'table') then return p.tableLength(o) == 0 end
    return false
end
-- Merges t2 into t1 and returns t1.
-- nil arguments are treated as empty tables, other non-table arguments are wrapped into a list.
-- Where both sides hold a table under the same key the tables are merged recursively. Otherwise
-- values with a numeric key are appended to t1 and values with any other key overwrite the entry
-- in t1. Tables taken from t2 are inserted by reference, not copied.
--test: mw.logObject(p.tableMerge({"string", test1="test1", subtable1={"test"}}, {"string2", test1="test2", test3="test4"}))
function p.tableMerge(t1, t2)
    if (t1 == nil) then
        t1 = {}
    elseif (type(t1) ~= 'table') then
        t1 = {t1}
    end
    if (t2 == nil) then
        t2 = {}
    elseif (type(t2) ~= 'table') then
        t2 = {t2}
    end

    for key, incoming in pairs(t2) do
        local existing = t1[key]
        if (type(incoming) == "table" and type(existing) == "table") then
            p.tableMerge(existing, incoming)
        elseif (type(key) == 'number') then
            table.insert(t1, incoming)
        else
            t1[key] = incoming
        end
    end
    return t1
end
-- Deep copy of a value, from https://stackoverflow.com/questions/640642/how-do-you-copy-a-lua-table-by-value
-- Non-table values are returned as they are. Tables are copied recursively (keys and values),
-- the copy receives the metatable of the original.
-- seen: internal map original -> copy; it lets tables that are referenced several times
--       (including cycles) be copied only once
function p.copy(obj, seen)
    if type(obj) ~= 'table' then return obj end
    if seen and seen[obj] then return seen[obj] end

    local visited = seen or {}
    local duplicate = setmetatable({}, getmetatable(obj))
    visited[obj] = duplicate -- register before descending, otherwise cycles would recurse forever
    for key, value in pairs(obj) do
        local key_copy = p.copy(key, visited)
        local value_copy = p.copy(value, visited)
        duplicate[key_copy] = value_copy
    end
    return duplicate
end
-- build normalized multilang label
-- properties:    dict of semantic properties; 'HasNormalizedLabel' is written into it
-- use_fallbacks: if true (default), 'HasName' and then 'Display title of' are used
--                when 'HasLabel' is not set; their values are tagged with the language "en"
-- returns nothing
-- A label "<text>@<lang>" is normalized by lower-casing <text> and removing every character
-- that is not matched by %w. Labels without a language tag are tagged with "en".
function p.setNormalizedLabel(properties, use_fallbacks)
    if (use_fallbacks == nil) then use_fallbacks = true end

    -- lower-cases the text and strips all characters not matched by %w
    local function normalize(text)
        return (text:lower():gsub('[^%w]+', '')) -- parentheses drop the replacement count returned by gsub
    end

    -- wraps a single value into a list
    local function as_list(value)
        if (type(value) ~= 'table') then return {value} end
        return value
    end

    if (properties['HasLabel'] ~= nil) then
        local normalized = {}
        properties['HasNormalizedLabel'] = normalized
        for _, label in ipairs(as_list(properties['HasLabel'])) do
            local parts = p.splitString(label, '@')
            -- a label without text (e. g. "") yields no parts at all
            local label_norm = normalize(parts[1] or "")
            local label_lang = parts[2] or "en"
            table.insert(normalized, label_norm .. "@" .. label_lang)
        end
        return
    end

    if (not use_fallbacks) then return end

    -- fallbacks in order of preference, assume English lang
    for _, fallback in ipairs({'HasName', 'Display title of'}) do
        if (properties[fallback] ~= nil) then
            local normalized = {}
            properties['HasNormalizedLabel'] = normalized
            for _, label in ipairs(as_list(properties[fallback])) do
                table.insert(normalized, normalize(label) .. "@en")
            end
            return
        end
    end
end
return p