diff --git a/data-wrapper/v1/csv.ini b/data-wrapper/v1/csv.ini deleted file mode 100644 index 069b718..0000000 --- a/data-wrapper/v1/csv.ini +++ /dev/null @@ -1,67 +0,0 @@ -# Entrypoint output format -mimeType = application/x-gzip -extension = tar.gz - -# OpenAPI Documentation - JSON format (dot notation) -post.operationId = post-v1-csv -post.summary = Transformation d'un fichier CSV en fichier corpus -post.description = Le fichier est transformé en fichier corpus exploitable par un web service asynchrone -post.tags.0 = data-wrapper -post.requestBody.content.text/csv.schema.type = string -post.requestBody.content.text/csv.schema.format = binary -post.requestBody.required = true -post.responses.default.description = Fichier corpus au format tar.gz -post.responses.default.content.application/x-gzip.schema.type = string -post.responses.default.content.application/x-gzip.schema.format = binary -post.parameters.0.description = Nom du champ à exploiter comme identifiant de colonne -post.parameters.0.in = query -post.parameters.0.name = id -post.parameters.0.schema.type = string -post.parameters.0.schema.default = id -post.parameters.0.required = false -post.parameters.1.description = Nom du champ à exploiter comme identifiant de ligne -post.parameters.1.in = query -post.parameters.1.name = value -post.parameters.1.schema.type = string -post.parameters.1.schema.default = value -post.parameters.1.required = false -post.parameters.2.description = chaque ligne est réduite à un object contenant 2 champs (id, value) -post.parameters.2.in = query -post.parameters.2.name = slim -post.parameters.2.schema.type = boolean -post.parameters.2.schema.default = true -post.parameters.2.required = false - -[env] -path = slim -value = env('slim').thru(x => (x === 'false' ? false : true)) - -[use] -plugin = basics - -[CSVParse] - -[CSVObject] - -[assign] -path = id -value = get(env('id', 'id')) -path = value -value = get(env('value', 'value')) - -[exchange] -value = self().thru(x => _.env(null, 'slim') ? _.pick(x, ['id', 'value']) : x) - -# in the hope that all the lines look the same -[singleton] -[singleton/validate] -path = value -rule = required - -[TARDump] -compress = true -manifest = fix({version: '1'}) -manifest = fix({generator: 'v1/csv'}) -manifest = fix({parameters: _.omit(_.env(), 'headers')}) -manifest = fix({hostAgent: _.get(_.env(), 'headers.host')}) -manifest = fix({userAgent: _.get(_.env(), 'headers.user-agent')}) diff --git a/data-wrapper/v1/fields/csv.ini b/data-wrapper/v1/fields/csv.ini deleted file mode 100644 index aa29059..0000000 --- a/data-wrapper/v1/fields/csv.ini +++ /dev/null @@ -1,41 +0,0 @@ -# Entrypoint output format -mimeType = application/json -extension = json - -# OpenAPI Documentation - JSON format (dot notation) -post.operationId = post-v1-fields-csv -post.description = Récupération des colonnes d'un fichier CSV -post.summary = Le fichier est analysé pour lister les colonnes utilisées -post.tags.0 = data-wrapper -post.requestBody.content.text/csv.schema.type = string -post.requestBody.content.text/csv.schema.format = binary -post.requestBody.required = true -post.responses.default.description = Liste des colonnes trouvées -post.responses.default.content.application/json.schema.$ref = #/components/schemas/JSONStream -post.responses.default.content.application/json.example.0.value = Title -post.responses.default.content.application/json.example.1.value = Keywords -post.parameters.0.description = Indenter le JSON résultant -post.parameters.0.in = query -post.parameters.0.name = indent -post.parameters.0.schema.type = boolean - -[use] -plugin = basics - -[CSVParse] - -[CSVObject] - -[shift] - -[exchange] -value = self().keys() - -[ungroup] - -[replace] -path = value -value = self() - -[dump] -indent = env('indent', false) diff --git a/data-wrapper/v1/istex-tar-gz.ini b/data-wrapper/v1/istex-tar-gz.ini deleted file mode 100644 index 0c01461..0000000 --- a/data-wrapper/v1/istex-tar-gz.ini +++ /dev/null @@ -1,64 +0,0 @@ -# Entrypoint output format -mimeType = application/x-gzip -extension = tar.gz - -# OpenAPI Documentation - JSON format (dot notation) -post.operationId = post-v1-tar-gz -post.summary = Transformation d'un fichier ISTEX (format tar.gz) en fichier corpus -post.description = Le fichier est transformé en fichier corpus exploitable par un web service asynchrone -post.tags.0 = data-wrapper -post.requestBody.content.application/x-gzip.schema.type = string -post.requestBody.content.application/x-gzip.schema.format = binary -post.requestBody.content.application/x-tar.schema.type = string -post.requestBody.content.application/x-tar.schema.format = binary -post.requestBody.required = true -post.responses.default.description = Fichier corpus au format tar.gz -post.responses.default.content.application/x-gzip.schema.type = string -post.responses.default.content.application/x-gzip.schema.format = binary -post.parameters.0.description = Nom du champ à exploiter contenant l'identifiant -post.parameters.0.in = query -post.parameters.0.name = id -post.parameters.0.schema.type = string -post.parameters.0.schema.default = ark.0 -post.parameters.0.required = false -post.parameters.1.description = Nom du champ à exploiter contenant la valeur -post.parameters.1.in = query -post.parameters.1.name = value -post.parameters.1.schema.type = string -post.parameters.1.schema.default = abstract -post.parameters.1.required = false -post.parameters.2.description = chaque objet est réduit à un object contenant 2 champs (id, value) -post.parameters.2.in = query -post.parameters.2.name = slim -post.parameters.2.schema.type = boolean -post.parameters.2.schema.default = true -post.parameters.2.required = false - -[env] -path = slim -value = env('slim').thru(x => (x === 'false' ? false : true)) - -[use] -plugin = basics - -[TARExtract] -compress = true -path = */*.json - -[assign] -path = id -value = get(env('id', 'ark.0')) - -path = value -value = get(env('value', 'abstract')) - -[exchange] -value = self().thru(x => _.env(null, 'slim') ? _.pick(x, ['id', 'value']) : x) - -[TARDump] -compress = true -manifest = fix({version: '1'}) -manifest = fix({generator: 'v1/istex-tar-gz'}) -manifest = fix({parameters: _.omit(_.env(), 'headers')}) -manifest = fix({hostAgent: _.get(_.env(), 'headers.host')}) -manifest = fix({userAgent: _.get(_.env(), 'headers.user-agent')}) diff --git a/data-wrapper/v1/new-persee-tei.xsl b/data-wrapper/v1/new-persee-tei.xsl deleted file mode 100644 index 69e9523..0000000 --- a/data-wrapper/v1/new-persee-tei.xsl +++ /dev/null @@ -1,57 +0,0 @@ - - - - - - - - - - - - - - - - - - <xsl:value-of - select="//tei:fileDesc/tei:titleStmt/tei:title"/> - - - - - - - - - - - - - - - - - - -

- -

-
- - - - - - - - - - - -
diff --git a/data-wrapper/v1/query-conditor.ini b/data-wrapper/v1/query-conditor.ini deleted file mode 100644 index a44ebe0..0000000 --- a/data-wrapper/v1/query-conditor.ini +++ /dev/null @@ -1,73 +0,0 @@ -# Entrypoint output format -mimeType = application/x-gzip -extension = tar.gz - -# OpenAPI Documentation - JSON format (dot notation) -post.operationId = post-v1-query-conditor -post.summary = Téléchargement des documents Conditor répondant à une requête -post.description = Le fichier en entrée contient une requête dont le résultat produira un fichier corpus exploitable par un web service asynchrone -post.tags.0 = data-wrapper -post.requestBody.content.text/plain.schema.type = string -post.requestBody.content.text/plain.schema.format = binary -post.requestBody.required = true -post.responses.default.description = Fichier corpus au format tar.gz -post.responses.default.content.application/x-gzip.schema.type = string -post.responses.default.content.application/x-gzip.schema.format = binary -post.parameters.0.description = Nom du champ à exploiter comme identifiant de colonne -post.parameters.0.in = query -post.parameters.0.name = id -post.parameters.0.schema.type = string -post.parameters.0.schema.default = business.sourceUidChain -post.parameters.0.required = false -post.parameters.1.description = Nom du champ à exploiter comme identifiant de ligne -post.parameters.1.in = query -post.parameters.1.name = value -post.parameters.1.schema.type = string -post.parameters.1.schema.default = title.en -post.parameters.1.required = false -post.parameters.2.description = chaque ligne est réduite à un object contenant 2 champs (id, value) -post.parameters.2.in = query -post.parameters.2.name = slim -post.parameters.2.schema.type = boolean -post.parameters.2.schema.default = true -post.parameters.2.required = false - -[env] -path = slim -value = env('slim').thru(x => (x === 'false' ? false : true)) - -[use] -plugin = basics -plugin = conditor - -[TXTConcat] - -[replace] -path = q -value = self().trim() - -[CORHALFetch] -url = https://corhal-api.inist.fr -retries = 3 -timeout = 60000 - -[assign] -path = id -value = get(env('id', 'business.sourceUidChain')) -path = value -value = get(env('value', 'title.en')) -value = self() - -[exchange] -value = self().thru(x => _.env(null, 'slim') ? _.pick(x, ['id', 'value']) : x) - -[TARDump] -compress = true -manifest = fix({version: '1'}) -manifest = fix({generator: 'v1/query-conditor'}) -manifest = fix({parameters: _.omit(_.env(), 'headers')}) -manifest = fix({hostAgent: _.get(_.env(), 'headers.host')}) -manifest = fix({userAgent: _.get(_.env(), 'headers.user-agent')}) - - - diff --git a/data-wrapper/v1/query-istex.ini b/data-wrapper/v1/query-istex.ini deleted file mode 100644 index 7ee7546..0000000 --- a/data-wrapper/v1/query-istex.ini +++ /dev/null @@ -1,74 +0,0 @@ -# Entrypoint output format -mimeType = application/x-gzip -extension = tar.gz - -# OpenAPI Documentation - JSON format (dot notation) -post.operationId = post-v1-query-istex -post.summary = Téléchargement des documents ISTEX répondant à une requete -post.description = Le fichier en entrée contient une requête dont le résultat produira un fichier corpus exploitable par un web service asynchrone -post.tags.0 = data-wrapper -post.requestBody.content.text/plain.schema.type = string -post.requestBody.content.text/plain.schema.format = binary -post.requestBody.required = true -post.responses.default.description = Fichier corpus au format tar.gz -post.responses.default.content.application/x-gzip.schema.type = string -post.responses.default.content.application/x-gzip.schema.format = binary -post.parameters.0.description = Nom du champ à exploiter comme identifiant de colonne -post.parameters.0.in = query -post.parameters.0.name = id -post.parameters.0.schema.type = string -post.parameters.0.schema.default = arkIstex -post.parameters.0.required = false -post.parameters.1.description = Nom du champ à exploiter comme identifiant de ligne -post.parameters.1.in = query -post.parameters.1.name = value -post.parameters.1.schema.type = string -post.parameters.1.schema.default = title -post.parameters.1.required = false -post.parameters.2.description = chaque ligne est réduite à un object contenant 2 champs (id, value) -post.parameters.2.in = query -post.parameters.2.name = slim -post.parameters.2.schema.type = boolean -post.parameters.2.schema.default = true -post.parameters.2.required = false - -[env] -path = slim -value = env('slim').thru(x => (x === 'false' ? false : true)) - -[use] -plugin = basics -plugin = istex - -[TXTConcat] - -[replace] -path = q -value = self().trim() - -[ISTEXScroll] -query = get('q') -field = * - -[ISTEXResult] - -[assign] -path = id -value = get(env('id', 'arkIstex')) -path = value -value = get(env('value', 'title')) -value = self() - -[exchange] -value = self().thru(x => _.env(null, 'slim') ? _.pick(x, ['id', 'value']) : x) - -[TARDump] -compress = true -manifest = fix({version: '1'}) -manifest = fix({generator: 'v1/query-istex'}) -manifest = fix({parameters: _.omit(_.env(), 'headers')}) -manifest = fix({hostAgent: _.get(_.env(), 'headers.host')}) -manifest = fix({userAgent: _.get(_.env(), 'headers.user-agent')}) - - - diff --git a/data-wrapper/v1/tar-tei2json.ini b/data-wrapper/v1/tar-tei2json.ini deleted file mode 100644 index 83489ea..0000000 --- a/data-wrapper/v1/tar-tei2json.ini +++ /dev/null @@ -1,43 +0,0 @@ -# Entrypoint output format -mimeType = application/x-gzip -extension = tar.gz - -# OpenAPI Documentation - JSON format (dot notation) -post.operationId = post-v1-tei2json -post.summary = Transformation d'un fichier TEI en fichier corpus -post.description = Le fichier est transformé en fichier corpus exploitable par un web service asynchrone, chaque document TEI est préalablement transformé en JSON -post.tags.0 = data-wrapper -post.requestBody.content.application/x-gzip.schema.type = string -post.requestBody.content.application/x-gzip.schema.format = binary -post.requestBody.content.application/x-tar.schema.type = string -post.requestBody.content.application/x-tar.schema.format = binary -post.requestBody.required = true -post.responses.default.description = Fichier corpus au format tar.gz -post.responses.default.content.application/x-gzip.schema.type = string -post.responses.default.content.application/x-gzip.schema.format = binary - -[use] -plugin = basics - -[TARExtract] -path = **/*.xml -compress = true -json = false - -[map] -path = value -[map/XMLParse] -separator = /tei:TEI -separator = /tei - -[replace] -path = fileName -value = get('id') - -path = fileContent -value = get('value.0') - -[TARDump] -compress = true -manifest = fix({version: '1'}) -manifest = fix({generator: 'v1/tar-tei2json'}) diff --git a/data-wrapper/v1/tar-tei2xml.ini b/data-wrapper/v1/tar-tei2xml.ini deleted file mode 100644 index 624bce9..0000000 --- a/data-wrapper/v1/tar-tei2xml.ini +++ /dev/null @@ -1,41 +0,0 @@ -# Entrypoint output format -mimeType = application/x-gzip -extension = tar.gz - -# OpenAPI Documentation - JSON format (dot notation) -post.operationId = post-v1-tar-tei2xml -post.summary = Transformation d'un fichier TEI en fichier corpus -post.description = Le fichier est transformé en fichier corpus exploitable par un web service asynchrone, chaque document TEI est préalablement simplifié en fichier XML minimal -post.tags.0 = data-wrapper -post.requestBody.content.application/x-gzip.schema.type = string -post.requestBody.content.application/x-gzip.schema.format = binary -post.requestBody.content.application/x-tar.schema.type = string -post.requestBody.content.application/x-tar.schema.format = binary -post.requestBody.required = true -post.responses.default.description = Fichier corpus au format tar.gz -post.responses.default.content.application/x-gzip.schema.type = string -post.responses.default.content.application/x-gzip.schema.format = binary - -[use] -plugin = basics -plugin = xslt - -[TARExtract] -path = **/*.xml -compress = true -json = false - -[map] -path = value -[map/xslt] -stylesheet = ./v1/new-persee-tei.xsl - -[exchange] -value = get('value.0') - -[TARDump] -compress = true -extension = xml -json = false -manifest = fix({version: '1'}) -manifest = fix({generator: 'v1/tar-tei2xml'})