Vorläufig ohne Zeitschriftenhefte #31 und nur mit einem Direktlink #25

This commit is contained in:
Felix Lohmeier 2021-03-19 16:12:58 +01:00
parent 8cd0b69f70
commit dd614a6e2d
3 changed files with 73 additions and 5 deletions

View File

@ -4,7 +4,7 @@ tasks:
main: main:
desc: miami ULB Münster desc: miami ULB Münster
vars: vars:
MINIMUM: 7300 # Mindestanzahl der zu erwartenden Datensätze MINIMUM: 6600 # Mindestanzahl der zu erwartenden Datensätze
PROJECT: '{{splitList ":" .TASK | first}}' # results in the task namespace, which is identical to the directory name PROJECT: '{{splitList ":" .TASK | first}}' # results in the task namespace, which is identical to the directory name
cmds: cmds:
- task: harvest - task: harvest
@ -65,6 +65,18 @@ tasks:
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}" "$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/nur-mit-pdf.json --apply config/nur-mit-pdf.json
> {{.LOG}} > {{.LOG}}
- > # Remove the separate download link when only one file is present
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/flocat.json
> {{.LOG}}
- > # Temporarily delete records that contain more than one direct link https://github.com/opencultureconsulting/noah/issues/25 - NOTE(review): the facet expression in this config appears to also remove records whose single link does not contain '.pdf'; confirm
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/nur-ein-direktlink.json
> {{.LOG}}
- > # Temporarily delete journal issues https://github.com/opencultureconsulting/noah/issues/31
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/keine-zeitschriftenhefte.json
> {{.LOG}}
- > # Datensätze mit "restriction on access" löschen - > # Datensätze mit "restriction on access" löschen
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}" "$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/restriction.json --apply config/restriction.json
@ -85,10 +97,6 @@ tasks:
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}" "$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/abstract.json --apply config/abstract.json
> {{.LOG}} > {{.LOG}}
- > # Remove the separate download link when only one file is present
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/flocat.json
> {{.LOG}}
- > # mets:file - ID eindeutig machen, um Validierungsfehler zu vermeiden - > # mets:file - ID eindeutig machen, um Validierungsfehler zu vermeiden
"$CLIENT" -P {{.PORT}} "{{.PROJECT}}" "$CLIENT" -P {{.PORT}} "{{.PROJECT}}"
--apply config/file-id.json --apply config/file-id.json

View File

@ -0,0 +1,30 @@
[
{
"op": "core/row-removal",
"engineConfig": {
"facets": [
{
"type": "list",
"name": "mets:mets - mets:dmdSec - mets:mdWrap - mets:xmlData - mods:mods - mods:genre",
"expression": "value",
"columnName": "mets:mets - mets:dmdSec - mets:mdWrap - mets:xmlData - mods:mods - mods:genre",
"invert": false,
"omitBlank": false,
"omitError": false,
"selection": [
{
"v": {
"v": "PeriodicalPart",
"l": "PeriodicalPart"
}
}
],
"selectBlank": false,
"selectError": false
}
],
"mode": "record-based"
},
"description": "Remove rows"
}
]

View File

@ -0,0 +1,30 @@
[
{
"op": "core/row-removal",
"engineConfig": {
"facets": [
{
"type": "list",
"name": "mets:mets - mets:fileSec - mets:fileGrp - mets:file - mets:FLocat - xlink:href",
"expression": "grel:with(row.record.cells[columnName].value, x, and(x.length() == 1, x[0].toLowercase().contains('.pdf')))",
"columnName": "mets:mets - mets:fileSec - mets:fileGrp - mets:file - mets:FLocat - xlink:href",
"invert": false,
"omitBlank": false,
"omitError": false,
"selection": [
{
"v": {
"v": false,
"l": "false"
}
}
],
"selectBlank": false,
"selectError": false
}
],
"mode": "record-based"
},
"description": "Remove rows"
}
]