From 3da70f8553c496dd5810131f6f607e5b077f6b1d Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 6 May 2024 15:59:12 +0200 Subject: [PATCH 01/46] Create Deployment.yaml --- Deployment.yaml | 55 +++++++++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 55 insertions(+) create mode 100644 Deployment.yaml diff --git a/Deployment.yaml b/Deployment.yaml new file mode 100644 index 00000000..56ca6ee9 --- /dev/null +++ b/Deployment.yaml @@ -0,0 +1,55 @@ +--- +apiVersion: apps/v1 +kind: Deployment +metadata: + name: Kraftwerk +spec: + selector: + matchLabels: + app: Kraftwerk + template: + metadata: + labels: + app: Kraftwerk + spec: + automountServiceAccountToken: false + containers: + - name: Kraftwerk + image: gitlab-registry.insee.fr/sic/traitements-post-collecte/deployment/kraftwerk-deployment:latest + imagePullPolicy: Always + securityContext: + allowPrivilegeEscalation: false + capabilities: + drop: + - ALL + readOnlyRootFilesystem: true + runAsNonRoot: true + resources: + limits: + memory: "600Mi" + cpu: "500m" + requests: + memory: "1Mi" + cpu: "10m" + ports: + - containerPort: 8080 + livenessProbe: + failureThreshold: 3 + httpGet: + path: /actuator/health/liveness + port: http + scheme: HTTP + initialDelaySeconds: 15 + periodSeconds: 10 + successThreshold: 1 + timeoutSeconds: 1 + readinessProbe: + failureThreshold: 3 + httpGet: + path: /actuator/health/readiness + port: http + scheme: HTTP + initialDelaySeconds: 15 + periodSeconds: 10 + successThreshold: 1 + timeoutSeconds: 1 \ No newline at end of file From 39aff082aea51b6a3534fcdac6df3159ce6cc83d Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Tue, 7 May 2024 10:43:25 +0200 Subject: [PATCH 02/46] Add k8s manifests --- kraftwerk-api/pom.xml | 4 ++++ Deployment.yaml => manifests/Deployment.yaml | 10 ++++----- manifests/Ingress.yaml | 22 ++++++++++++++++++++ manifests/Service.yaml | 11 ++++++++++ 4 files changed, 42 insertions(+), 5 deletions(-) rename Deployment.yaml => manifests/Deployment.yaml (86%) create mode 100644 manifests/Ingress.yaml create mode 100644 manifests/Service.yaml diff --git a/kraftwerk-api/pom.xml b/kraftwerk-api/pom.xml index d63fb197..90df7e07 100644 --- a/kraftwerk-api/pom.xml +++ b/kraftwerk-api/pom.xml @@ -71,6 +71,10 @@ org.springframework.boot spring-boot-maven-plugin + + fr.insee.kraftwerk.api.KraftwerkApi + JAR + diff --git a/Deployment.yaml b/manifests/Deployment.yaml similarity index 86% rename from Deployment.yaml rename to manifests/Deployment.yaml index 56ca6ee9..aa487924 100644 --- a/Deployment.yaml +++ b/manifests/Deployment.yaml @@ -2,20 +2,20 @@ apiVersion: apps/v1 kind: Deployment metadata: - name: Kraftwerk + name: kraftwerk spec: selector: matchLabels: - app: Kraftwerk + app: kraftwerk template: metadata: labels: - app: Kraftwerk + app: kraftwerk spec: automountServiceAccountToken: false containers: - - name: Kraftwerk - image: gitlab-registry.insee.fr/sic/traitements-post-collecte/deployment/kraftwerk-deployment:latest + - name: kraftwerk + image: gitlab-registry.insee.fr:443/sic/traitements-post-collecte/deployment/kraftwerk-deployment:latest imagePullPolicy: Always securityContext: allowPrivilegeEscalation: false diff --git a/manifests/Ingress.yaml b/manifests/Ingress.yaml new file mode 100644 index 00000000..0f6f904a --- /dev/null +++ b/manifests/Ingress.yaml @@ -0,0 +1,22 @@ +apiVersion: networking.k8s.io/v1 +kind: Ingress +metadata: + name: kraftwerk-ingress + namespace: + labels: + name: kraftwerk +spec: + tls: + - hosts: + - api-transformation-post-collecte.dev.kube.insee.fr + rules: + - host: api-transformation-post-collecte.dev.kube.insee.fr + http: + paths: + - pathType: Prefix + path: "/" + backend: + service: + name: kraftwerk + port: + number: 8080 diff --git a/manifests/Service.yaml b/manifests/Service.yaml new file mode 100644 index 00000000..8049e1f5 --- /dev/null +++ b/manifests/Service.yaml @@ -0,0 +1,11 @@ +--- +apiVersion: v1 +kind: Service +metadata: + name: kraftwerk +spec: + selector: + app: kraftwerk + ports: + - port: 8080 + targetPort: 8080 \ No newline at end of file From 7a0824006462f437dcea0fba33e68b2a14ca4f8d Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Tue, 7 May 2024 16:14:12 +0200 Subject: [PATCH 03/46] Removed app-to-import jar from dockerfile --- Dockerfile | 2 +- kraftwerk-api/pom.xml | 1 - 2 files changed, 1 insertion(+), 2 deletions(-) diff --git a/Dockerfile b/Dockerfile index cc12cfc5..07a3570e 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,6 +1,6 @@ # Java 21 FROM gitlab-registry.insee.fr:443/kubernetes/images/run/jre:21.0.1_12-jre-jammy-rootless -COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api-*app-to-import.jar kraftwerk.jar +COPY --chown=$JAVA_USER:$JAVA_USER --exclude=*-app-to-import.jar Kraftwerk/kraftwerk-api/target/kraftwerk-api-*.jar kraftwerk.jar EXPOSE 8080 diff --git a/kraftwerk-api/pom.xml b/kraftwerk-api/pom.xml index 90df7e07..1ef31633 100644 --- a/kraftwerk-api/pom.xml +++ b/kraftwerk-api/pom.xml @@ -72,7 +72,6 @@ org.springframework.boot spring-boot-maven-plugin - fr.insee.kraftwerk.api.KraftwerkApi JAR From 21b39d559b9a0bc87e1fc809fbee9777ff449883 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Tue, 7 May 2024 16:31:24 +0200 Subject: [PATCH 04/46] Update Dockerfile --- Dockerfile | 4 +++- 1 file changed, 3 insertions(+), 1 deletion(-) diff --git a/Dockerfile b/Dockerfile index 07a3570e..dc305dab 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,6 +1,8 @@ # Java 21 FROM gitlab-registry.insee.fr:443/kubernetes/images/run/jre:21.0.1_12-jre-jammy-rootless -COPY --chown=$JAVA_USER:$JAVA_USER --exclude=*-app-to-import.jar Kraftwerk/kraftwerk-api/target/kraftwerk-api-*.jar kraftwerk.jar +RUN export VERSION_KRAFTWERK=$(mvn -f pom.xml help:evaluate -Dexpression=project.version -q -DforceStdout) + +COPY --chown=$JAVA_USER:$JAVA_USER --exclude=*-app-to-import.jar Kraftwerk/kraftwerk-api/target/kraftwerk-api-$VERSION_KRAFTWERK.jar kraftwerk.jar EXPOSE 8080 From 1455609185b211b07c7bb41cd37ed368326cfb9d Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Tue, 7 May 2024 16:31:47 +0200 Subject: [PATCH 05/46] Update Dockerfile --- Dockerfile | 3 +-- 1 file changed, 1 insertion(+), 2 deletions(-) diff --git a/Dockerfile b/Dockerfile index dc305dab..abfd0dcb 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,8 +1,7 @@ # Java 21 FROM gitlab-registry.insee.fr:443/kubernetes/images/run/jre:21.0.1_12-jre-jammy-rootless RUN export VERSION_KRAFTWERK=$(mvn -f pom.xml help:evaluate -Dexpression=project.version -q -DforceStdout) - -COPY --chown=$JAVA_USER:$JAVA_USER --exclude=*-app-to-import.jar Kraftwerk/kraftwerk-api/target/kraftwerk-api-$VERSION_KRAFTWERK.jar kraftwerk.jar +COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api-$VERSION_KRAFTWERK.jar kraftwerk.jar EXPOSE 8080 From 69db7f74e037d1bce0d0660b029a1d78f331a027 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Tue, 7 May 2024 16:56:32 +0200 Subject: [PATCH 06/46] Update Dockerfile --- Dockerfile | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/Dockerfile b/Dockerfile index abfd0dcb..1de00eb2 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,6 +1,6 @@ # Java 21 FROM gitlab-registry.insee.fr:443/kubernetes/images/run/jre:21.0.1_12-jre-jammy-rootless -RUN export VERSION_KRAFTWERK=$(mvn -f pom.xml help:evaluate -Dexpression=project.version -q -DforceStdout) +ARG VERSION_KRAFTWERK COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api-$VERSION_KRAFTWERK.jar kraftwerk.jar EXPOSE 8080 From d49117d78aa2fcd58632683ef8c8ad5b4d3c82ff Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 13 May 2024 10:01:59 +0200 Subject: [PATCH 07/46] Add actuators + add config map --- .../src/main/resources/application.properties | 10 ++++++++++ manifests/ConfigMapDV.yaml | 14 ++++++++++++++ manifests/Deployment.yaml | 9 ++++++--- manifests/Ingress.yaml | 2 +- manifests/Service.yaml | 2 +- pom.xml | 4 ++++ 6 files changed, 36 insertions(+), 5 deletions(-) create mode 100644 manifests/ConfigMapDV.yaml diff --git a/kraftwerk-api/src/main/resources/application.properties b/kraftwerk-api/src/main/resources/application.properties index 0185af9a..658a1a3d 100644 --- a/kraftwerk-api/src/main/resources/application.properties +++ b/kraftwerk-api/src/main/resources/application.properties @@ -20,3 +20,13 @@ fr.insee.postcollecte.csv.output.quote =" fr.insee.postcollecte.size-limit = 419430400 +#-------------------------------------------------------------------------- +# Actuator +# There are several ways to configure it : +# https://docs.spring.io/spring-boot/docs/3.0.0/reference/htmlsingle/#actuator.endpoints.exposing +#-------------------------------------------------------------------------- +management.health.probes.enabled=true +management.endpoint.health.show-details=always +#Global deactivation and activation endpoint by endpoint +#management.endpoints.enabled-by-default=false +#management.endpoint.info.enabled=true \ No newline at end of file diff --git a/manifests/ConfigMapDV.yaml b/manifests/ConfigMapDV.yaml new file mode 100644 index 00000000..d6fd84a7 --- /dev/null +++ b/manifests/ConfigMapDV.yaml @@ -0,0 +1,14 @@ +apiVersion: v1 +kind: ConfigMap +metadata: + name: kraftwerk-config-dv + namespace: default +data: + fr.insee.postcollecte.files: C:\\Users\\QDIBYS\\Documents\\Kraftwerk_folder + logging.level.root: INFO + logging.level.fr.insee.kraftwerk: INFO + logging.file.name: C:\\Users\\QDIBYS\\Documents\\Kraftwerk_folder\\log\\kraftwerk.log + logging.pattern.rolling-file-name: C:\\Users\\QDIBYS\\Documents\\Kraftwerk_folder\\log\\kraftwerk-%d{yyyy-MM-dd}.%i.log + fr.insee.postcollecte.genesis.api.url: http://api-reponses-enquetes.dev.kube.insee.fr + + server.port: 8080 \ No newline at end of file diff --git a/manifests/Deployment.yaml b/manifests/Deployment.yaml index aa487924..0b0a2383 100644 --- a/manifests/Deployment.yaml +++ b/manifests/Deployment.yaml @@ -2,7 +2,7 @@ apiVersion: apps/v1 kind: Deployment metadata: - name: kraftwerk + name: kraftwerk_deployment spec: selector: matchLabels: @@ -14,7 +14,7 @@ spec: spec: automountServiceAccountToken: false containers: - - name: kraftwerk + - name: kraftwerk_container image: gitlab-registry.insee.fr:443/sic/traitements-post-collecte/deployment/kraftwerk-deployment:latest imagePullPolicy: Always securityContext: @@ -52,4 +52,7 @@ spec: initialDelaySeconds: 15 periodSeconds: 10 successThreshold: 1 - timeoutSeconds: 1 \ No newline at end of file + timeoutSeconds: 1 + envFrom: + - configMapRef: + name: kraftwerk-config-dv \ No newline at end of file diff --git a/manifests/Ingress.yaml b/manifests/Ingress.yaml index 0f6f904a..df54594f 100644 --- a/manifests/Ingress.yaml +++ b/manifests/Ingress.yaml @@ -1,7 +1,7 @@ apiVersion: networking.k8s.io/v1 kind: Ingress metadata: - name: kraftwerk-ingress + name: kraftwerk_ingress namespace: labels: name: kraftwerk diff --git a/manifests/Service.yaml b/manifests/Service.yaml index 8049e1f5..bf9c8096 100644 --- a/manifests/Service.yaml +++ b/manifests/Service.yaml @@ -2,7 +2,7 @@ apiVersion: v1 kind: Service metadata: - name: kraftwerk + name: kraftwerk_service spec: selector: app: kraftwerk diff --git a/pom.xml b/pom.xml index aecc677d..9efdea8f 100644 --- a/pom.xml +++ b/pom.xml @@ -65,6 +65,10 @@ + + org.springframework.boot + spring-boot-starter-actuator + From 1adcc70575c81b8ee58fac864b389eedcccd8f2b Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 13 May 2024 14:03:44 +0200 Subject: [PATCH 08/46] Functionnal pod, only one --- manifests/ConfigMapDV.yaml | 9 ++++---- manifests/Deployment.yaml | 31 +++++++++++++++++++--------- manifests/Ingress.yaml | 6 +++--- manifests/PersistantVolumeClaim.yaml | 11 ++++++++++ manifests/Service.yaml | 2 +- 5 files changed, 40 insertions(+), 19 deletions(-) create mode 100644 manifests/PersistantVolumeClaim.yaml diff --git a/manifests/ConfigMapDV.yaml b/manifests/ConfigMapDV.yaml index d6fd84a7..2a601b33 100644 --- a/manifests/ConfigMapDV.yaml +++ b/manifests/ConfigMapDV.yaml @@ -2,13 +2,12 @@ apiVersion: v1 kind: ConfigMap metadata: name: kraftwerk-config-dv - namespace: default data: - fr.insee.postcollecte.files: C:\\Users\\QDIBYS\\Documents\\Kraftwerk_folder + fr.insee.postcollecte.files: /storage/data logging.level.root: INFO logging.level.fr.insee.kraftwerk: INFO - logging.file.name: C:\\Users\\QDIBYS\\Documents\\Kraftwerk_folder\\log\\kraftwerk.log - logging.pattern.rolling-file-name: C:\\Users\\QDIBYS\\Documents\\Kraftwerk_folder\\log\\kraftwerk-%d{yyyy-MM-dd}.%i.log + logging.file.name: /storage/log/kraftwerk.log + logging.pattern.rolling-file-name: /storage/log/kraftwerk-%d{yyyy-MM-dd}.%i.log fr.insee.postcollecte.genesis.api.url: http://api-reponses-enquetes.dev.kube.insee.fr - server.port: 8080 \ No newline at end of file + server.port: '8080' \ No newline at end of file diff --git a/manifests/Deployment.yaml b/manifests/Deployment.yaml index 0b0a2383..30a14a06 100644 --- a/manifests/Deployment.yaml +++ b/manifests/Deployment.yaml @@ -1,9 +1,9 @@ ---- apiVersion: apps/v1 kind: Deployment metadata: - name: kraftwerk_deployment + name: kraftwerk-deployment spec: + replicas: 1 #TODO Set to 3 with helm selector: matchLabels: app: kraftwerk @@ -14,7 +14,7 @@ spec: spec: automountServiceAccountToken: false containers: - - name: kraftwerk_container + - name: kraftwerk-container image: gitlab-registry.insee.fr:443/sic/traitements-post-collecte/deployment/kraftwerk-deployment:latest imagePullPolicy: Always securityContext: @@ -37,22 +37,33 @@ spec: failureThreshold: 3 httpGet: path: /actuator/health/liveness - port: http + port: 8080 scheme: HTTP - initialDelaySeconds: 15 - periodSeconds: 10 + initialDelaySeconds: 45 + periodSeconds: 60 successThreshold: 1 timeoutSeconds: 1 readinessProbe: failureThreshold: 3 httpGet: path: /actuator/health/readiness - port: http + port: 8080 scheme: HTTP - initialDelaySeconds: 15 - periodSeconds: 10 + initialDelaySeconds: 45 + periodSeconds: 60 successThreshold: 1 timeoutSeconds: 1 envFrom: - configMapRef: - name: kraftwerk-config-dv \ No newline at end of file + name: kraftwerk-config-dv + volumeMounts: + - mountPath: /tmp/ + name: kraftwerk-temp-volume + - mountPath: /storage/ + name: kraftwerk-volume + volumes: + - name: kraftwerk-temp-volume + emptyDir : {} + - name: kraftwerk-volume + persistentVolumeClaim: + claimName: kraftwerk-pvc \ No newline at end of file diff --git a/manifests/Ingress.yaml b/manifests/Ingress.yaml index df54594f..a6af9b37 100644 --- a/manifests/Ingress.yaml +++ b/manifests/Ingress.yaml @@ -1,10 +1,10 @@ apiVersion: networking.k8s.io/v1 kind: Ingress metadata: - name: kraftwerk_ingress + name: kraftwerk-ingress namespace: labels: - name: kraftwerk + name: kraftwerk-ingress spec: tls: - hosts: @@ -17,6 +17,6 @@ spec: path: "/" backend: service: - name: kraftwerk + name: kraftwerk-service port: number: 8080 diff --git a/manifests/PersistantVolumeClaim.yaml b/manifests/PersistantVolumeClaim.yaml new file mode 100644 index 00000000..8fd460ee --- /dev/null +++ b/manifests/PersistantVolumeClaim.yaml @@ -0,0 +1,11 @@ +apiVersion: v1 +kind: PersistentVolumeClaim +metadata: + name: kraftwerk-pvc +spec: + accessModes: + - ReadWriteOnce + resources: + requests: + storage: 1Gi + #TODO reclaimPolicy en recycle (pour éviter la suppression du PV) \ No newline at end of file diff --git a/manifests/Service.yaml b/manifests/Service.yaml index bf9c8096..fd3a84fa 100644 --- a/manifests/Service.yaml +++ b/manifests/Service.yaml @@ -2,7 +2,7 @@ apiVersion: v1 kind: Service metadata: - name: kraftwerk_service + name: kraftwerk-service spec: selector: app: kraftwerk From 96136a0d722f0d435ab2c49e8e918690ae9745c5 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 13 May 2024 15:32:52 +0200 Subject: [PATCH 09/46] Removed manifests (moved to argocd repo) --- manifests/ConfigMapDV.yaml | 13 ------ manifests/Deployment.yaml | 69 ---------------------------- manifests/Ingress.yaml | 22 --------- manifests/PersistantVolumeClaim.yaml | 11 ----- manifests/Service.yaml | 11 ----- 5 files changed, 126 deletions(-) delete mode 100644 manifests/ConfigMapDV.yaml delete mode 100644 manifests/Deployment.yaml delete mode 100644 manifests/Ingress.yaml delete mode 100644 manifests/PersistantVolumeClaim.yaml delete mode 100644 manifests/Service.yaml diff --git a/manifests/ConfigMapDV.yaml b/manifests/ConfigMapDV.yaml deleted file mode 100644 index 2a601b33..00000000 --- a/manifests/ConfigMapDV.yaml +++ /dev/null @@ -1,13 +0,0 @@ -apiVersion: v1 -kind: ConfigMap -metadata: - name: kraftwerk-config-dv -data: - fr.insee.postcollecte.files: /storage/data - logging.level.root: INFO - logging.level.fr.insee.kraftwerk: INFO - logging.file.name: /storage/log/kraftwerk.log - logging.pattern.rolling-file-name: /storage/log/kraftwerk-%d{yyyy-MM-dd}.%i.log - fr.insee.postcollecte.genesis.api.url: http://api-reponses-enquetes.dev.kube.insee.fr - - server.port: '8080' \ No newline at end of file diff --git a/manifests/Deployment.yaml b/manifests/Deployment.yaml deleted file mode 100644 index 30a14a06..00000000 --- a/manifests/Deployment.yaml +++ /dev/null @@ -1,69 +0,0 @@ -apiVersion: apps/v1 -kind: Deployment -metadata: - name: kraftwerk-deployment -spec: - replicas: 1 #TODO Set to 3 with helm - selector: - matchLabels: - app: kraftwerk - template: - metadata: - labels: - app: kraftwerk - spec: - automountServiceAccountToken: false - containers: - - name: kraftwerk-container - image: gitlab-registry.insee.fr:443/sic/traitements-post-collecte/deployment/kraftwerk-deployment:latest - imagePullPolicy: Always - securityContext: - allowPrivilegeEscalation: false - capabilities: - drop: - - ALL - readOnlyRootFilesystem: true - runAsNonRoot: true - resources: - limits: - memory: "600Mi" - cpu: "500m" - requests: - memory: "1Mi" - cpu: "10m" - ports: - - containerPort: 8080 - livenessProbe: - failureThreshold: 3 - httpGet: - path: /actuator/health/liveness - port: 8080 - scheme: HTTP - initialDelaySeconds: 45 - periodSeconds: 60 - successThreshold: 1 - timeoutSeconds: 1 - readinessProbe: - failureThreshold: 3 - httpGet: - path: /actuator/health/readiness - port: 8080 - scheme: HTTP - initialDelaySeconds: 45 - periodSeconds: 60 - successThreshold: 1 - timeoutSeconds: 1 - envFrom: - - configMapRef: - name: kraftwerk-config-dv - volumeMounts: - - mountPath: /tmp/ - name: kraftwerk-temp-volume - - mountPath: /storage/ - name: kraftwerk-volume - volumes: - - name: kraftwerk-temp-volume - emptyDir : {} - - name: kraftwerk-volume - persistentVolumeClaim: - claimName: kraftwerk-pvc \ No newline at end of file diff --git a/manifests/Ingress.yaml b/manifests/Ingress.yaml deleted file mode 100644 index a6af9b37..00000000 --- a/manifests/Ingress.yaml +++ /dev/null @@ -1,22 +0,0 @@ -apiVersion: networking.k8s.io/v1 -kind: Ingress -metadata: - name: kraftwerk-ingress - namespace: - labels: - name: kraftwerk-ingress -spec: - tls: - - hosts: - - api-transformation-post-collecte.dev.kube.insee.fr - rules: - - host: api-transformation-post-collecte.dev.kube.insee.fr - http: - paths: - - pathType: Prefix - path: "/" - backend: - service: - name: kraftwerk-service - port: - number: 8080 diff --git a/manifests/PersistantVolumeClaim.yaml b/manifests/PersistantVolumeClaim.yaml deleted file mode 100644 index 8fd460ee..00000000 --- a/manifests/PersistantVolumeClaim.yaml +++ /dev/null @@ -1,11 +0,0 @@ -apiVersion: v1 -kind: PersistentVolumeClaim -metadata: - name: kraftwerk-pvc -spec: - accessModes: - - ReadWriteOnce - resources: - requests: - storage: 1Gi - #TODO reclaimPolicy en recycle (pour éviter la suppression du PV) \ No newline at end of file diff --git a/manifests/Service.yaml b/manifests/Service.yaml deleted file mode 100644 index fd3a84fa..00000000 --- a/manifests/Service.yaml +++ /dev/null @@ -1,11 +0,0 @@ ---- -apiVersion: v1 -kind: Service -metadata: - name: kraftwerk-service -spec: - selector: - app: kraftwerk - ports: - - port: 8080 - targetPort: 8080 \ No newline at end of file From 408c7db2afa677f4c2dbbbf0807696fde6d4b811 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 14 Jun 2024 11:58:11 +0200 Subject: [PATCH 10/46] Add cli launch --- .../kraftwerk/api/batch/KraftwerkBatch.java | 91 +++++++++++++++++++ .../api/batch/KraftwerkServiceType.java | 11 +++ .../api/services/KraftwerkService.java | 2 +- 3 files changed, 103 insertions(+), 1 deletion(-) create mode 100644 kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java create mode 100644 kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkServiceType.java diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java new file mode 100644 index 00000000..e20357cf --- /dev/null +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -0,0 +1,91 @@ +package fr.insee.kraftwerk.api.batch; + +import fr.insee.kraftwerk.api.configuration.ConfigProperties; +import fr.insee.kraftwerk.api.process.MainProcessing; +import fr.insee.kraftwerk.api.process.MainProcessingGenesis; +import fr.insee.kraftwerk.api.services.KraftwerkService; +import lombok.extern.slf4j.Slf4j; +import org.springframework.beans.factory.annotation.Autowired; +import org.springframework.beans.factory.annotation.Value; +import org.springframework.boot.CommandLineRunner; +import org.springframework.stereotype.Component; + +@Component +@Slf4j +public class KraftwerkBatch implements CommandLineRunner { + @Autowired + public KraftwerkBatch(ConfigProperties configProperties) { + this.configProperties = configProperties; + } + + ConfigProperties configProperties; + + @Value("${fr.insee.postcollecte.files}") + protected String defaultDirectory; + + @Value("${fr.insee.postcollecte.size-limit}") + protected long limitSize; + + @Override + public void run(String... args) throws Exception{ + //If .jar launched with cli args + if (args.length > 0) { + log.info("Launching Kraftwerk using cli"); + + //Check arguments + checkArgs(args); + + //Parse arguments + KraftwerkServiceType kraftwerkServiceType = KraftwerkServiceType.valueOf(args[0]); + boolean archiveAtEnd = Boolean.parseBoolean(args[1]); + boolean withAllReportingData = Boolean.parseBoolean(args[2]); + String inDirectory = args[3]; + + //Kraftwerk service type related parameters + boolean fileByFile = kraftwerkServiceType == KraftwerkServiceType.FILE_BY_FILE; + boolean withDDI = kraftwerkServiceType != KraftwerkServiceType.LUNATIC_ONLY; + if(kraftwerkServiceType != KraftwerkServiceType.MAIN){ + withAllReportingData = false; + } + if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ + archiveAtEnd = false; + } + + + //Run kraftwerk + if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ + MainProcessingGenesis mainProcessingGenesis = new MainProcessingGenesis(configProperties); + mainProcessingGenesis.runMain(inDirectory); + }else{ + MainProcessing mainProcessing = new MainProcessing(inDirectory, fileByFile, withAllReportingData, withDDI, defaultDirectory, limitSize); + mainProcessing.runMain(); + } + + //Archive + if(Boolean.TRUE.equals(archiveAtEnd)){ + KraftwerkService kraftwerkService = new KraftwerkService(); + kraftwerkService.archive(inDirectory); + } + + System.exit(0); + } + } + + /** + * Throws a IllegalArgumentException if the arguments are not valid (ex: unparseable boolean) + * KraftwerkServiceType is already checked by valueOf + * @param args list of CLI arguments + * @throws IllegalArgumentException if invalid argument + */ + private static void checkArgs(String[] args) throws IllegalArgumentException{ + if(args.length != 4) { + throw new IllegalArgumentException("Invalid number of arguments ! Got %s instead of 4 !".formatted(args.length)); + } + if(!args[1].equals("true") && !args[1].equals("false")){ + throw new IllegalArgumentException("Invalid archiveAtEnd boolean argument !"); + } + if(!args[2].equals("true") && !args[2].equals("false")){ + throw new IllegalArgumentException("Invalid withAllReportingData boolean argument !"); + } + } +} diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkServiceType.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkServiceType.java new file mode 100644 index 00000000..031f6294 --- /dev/null +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkServiceType.java @@ -0,0 +1,11 @@ +package fr.insee.kraftwerk.api.batch; + +import lombok.AllArgsConstructor; + +@AllArgsConstructor +public enum KraftwerkServiceType { + MAIN, + LUNATIC_ONLY, + GENESIS, + FILE_BY_FILE; +} diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java index d0632af9..796519d8 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java @@ -47,7 +47,7 @@ public void initializeWithProperties() { controlInputSequence = new ControlInputSequence(defaultDirectory); } - protected ResponseEntity archive(String inDirectoryParam) { + public ResponseEntity archive(String inDirectoryParam) { Path inDirectory; try { inDirectory = controlInputSequence.getInDirectory(inDirectoryParam); From 823a756d71535d06abab2a0011f0925575b3c407 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 14 Jun 2024 13:13:54 +0200 Subject: [PATCH 11/46] Create batch dockerfile --- Dockerfile => docker/api/Dockerfile | 0 docker/batch/Dockerfile | 17 +++++++++++++++++ 2 files changed, 17 insertions(+) rename Dockerfile => docker/api/Dockerfile (100%) create mode 100644 docker/batch/Dockerfile diff --git a/Dockerfile b/docker/api/Dockerfile similarity index 100% rename from Dockerfile rename to docker/api/Dockerfile diff --git a/docker/batch/Dockerfile b/docker/batch/Dockerfile new file mode 100644 index 00000000..2ac68e4c --- /dev/null +++ b/docker/batch/Dockerfile @@ -0,0 +1,17 @@ +# Java 21 +FROM gitlab-registry.insee.fr:443/kubernetes/images/run/jre:21.0.1_12-jre-jammy-rootless +COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api-*app-to-import.jar kraftwerk.jar + +EXPOSE 8080 + +ARG serviceToUse +ARG archiveAtEnd +ARG withAllReportingData +ARG inDirectory + +ENV serviceToUse ${serviceToUse} +ENV archiveAtEnd ${archiveAtEnd} +ENV withAllReportingData ${withAllReportingData} +ENV inDirectory ${inDirectory} + +ENTRYPOINT ["java","-jar","/kraftwerk.jar", "$serviceToUse", "$archiveAtEnd","$withAllReportingData", "$inDirectory"] \ No newline at end of file From cddc8f3cbcd4453c217fc88fda59cea016b68e90 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 14 Jun 2024 13:16:21 +0200 Subject: [PATCH 12/46] Revert "Create batch dockerfile" This reverts commit 823a756d71535d06abab2a0011f0925575b3c407. --- docker/api/Dockerfile => Dockerfile | 0 docker/batch/Dockerfile | 17 ----------------- 2 files changed, 17 deletions(-) rename docker/api/Dockerfile => Dockerfile (100%) delete mode 100644 docker/batch/Dockerfile diff --git a/docker/api/Dockerfile b/Dockerfile similarity index 100% rename from docker/api/Dockerfile rename to Dockerfile diff --git a/docker/batch/Dockerfile b/docker/batch/Dockerfile deleted file mode 100644 index 2ac68e4c..00000000 --- a/docker/batch/Dockerfile +++ /dev/null @@ -1,17 +0,0 @@ -# Java 21 -FROM gitlab-registry.insee.fr:443/kubernetes/images/run/jre:21.0.1_12-jre-jammy-rootless -COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api-*app-to-import.jar kraftwerk.jar - -EXPOSE 8080 - -ARG serviceToUse -ARG archiveAtEnd -ARG withAllReportingData -ARG inDirectory - -ENV serviceToUse ${serviceToUse} -ENV archiveAtEnd ${archiveAtEnd} -ENV withAllReportingData ${withAllReportingData} -ENV inDirectory ${inDirectory} - -ENTRYPOINT ["java","-jar","/kraftwerk.jar", "$serviceToUse", "$archiveAtEnd","$withAllReportingData", "$inDirectory"] \ No newline at end of file From dbc06630142db30919f56128f4b27e942c4379e0 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 14 Jun 2024 13:18:12 +0200 Subject: [PATCH 13/46] Update Dockerfile --- Dockerfile | 1 + 1 file changed, 1 insertion(+) diff --git a/Dockerfile b/Dockerfile index cc12cfc5..fc905fb9 100644 --- a/Dockerfile +++ b/Dockerfile @@ -4,4 +4,5 @@ COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api- EXPOSE 8080 +#Docker run without additionnal params to use REST API mode, add batch parameters to use batch mode ENTRYPOINT ["java","-jar","/kraftwerk.jar"] \ No newline at end of file From feb421c519d429423b12d69bde826d8610b52e1e Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 19 Jun 2024 15:53:07 +0200 Subject: [PATCH 14/46] File utils to interface --- .../kraftwerk/api/batch/KraftwerkBatch.java | 7 +- .../kraftwerk/api/process/MainProcessing.java | 16 +++-- .../api/process/MainProcessingGenesis.java | 13 ++-- .../api/services/KraftwerkService.java | 14 ++-- .../kraftwerk/api/services/MainService.java | 24 +++++-- .../api/services/StepByStepService.java | 42 ++++++----- .../kraftwerk/core/inputs/UserInputs.java | 5 +- .../kraftwerk/core/inputs/UserInputsFile.java | 24 +++---- .../core/inputs/UserInputsGenesis.java | 10 +-- .../kraftwerk/core/outputs/OutputFiles.java | 4 +- .../BuildBindingsSequenceGenesis.java | 10 +-- .../core/sequence/ControlInputSequence.java | 5 +- .../core/sequence/MultimodalSequence.java | 12 ++-- .../core/sequence/UnimodalSequence.java | 14 ++-- .../sequence/VtlReaderWriterSequence.java | 4 +- .../core/sequence/WriterSequence.java | 4 +- .../{FileUtils.java => FileSystemImpl.java} | 72 ++++++------------- .../core/utils/FileUtilsInterface.java | 51 +++++++++++++ .../kraftwerk/core/utils/TextFileWriter.java | 8 +-- .../kraftwerk/core/utils/XMLSplitter.java | 2 +- .../insee/kraftwerk/core/vtl/VtlExecute.java | 4 +- .../core/inputs/UserInputsFileTest.java | 20 +++--- .../core/inputs/UserInputsGenesisTest.java | 3 +- .../core/outputs/CsvOutputFilesTest.java | 6 +- .../core/outputs/CsvTableWriterTest.java | 4 +- .../core/outputs/ParquetOutputFilesTest.java | 28 ++------ .../sequence/BuildBindingsSequenceTest.java | 8 ++- ...UtilsTest.java => FileSystemImplTest.java} | 25 ++++--- .../kraftwerk/core/utils/XMLSplitterTest.java | 8 ++- .../functional_tests/MainDefinitions.java | 30 ++++---- .../functional_tests/ParadataDefinitions.java | 5 +- 31 files changed, 272 insertions(+), 210 deletions(-) rename kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/{FileUtils.java => FileSystemImpl.java} (70%) create mode 100644 kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtilsInterface.java rename kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/{FileUtilsTest.java => FileSystemImplTest.java} (78%) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index e20357cf..2b363615 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -4,6 +4,7 @@ import fr.insee.kraftwerk.api.process.MainProcessing; import fr.insee.kraftwerk.api.process.MainProcessingGenesis; import fr.insee.kraftwerk.api.services.KraftwerkService; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; import lombok.extern.slf4j.Slf4j; import org.springframework.beans.factory.annotation.Autowired; import org.springframework.beans.factory.annotation.Value; @@ -54,17 +55,17 @@ public void run(String... args) throws Exception{ //Run kraftwerk if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ - MainProcessingGenesis mainProcessingGenesis = new MainProcessingGenesis(configProperties); + MainProcessingGenesis mainProcessingGenesis = new MainProcessingGenesis(configProperties, new FileSystemImpl()); mainProcessingGenesis.runMain(inDirectory); }else{ - MainProcessing mainProcessing = new MainProcessing(inDirectory, fileByFile, withAllReportingData, withDDI, defaultDirectory, limitSize); + MainProcessing mainProcessing = new MainProcessing(inDirectory, fileByFile, withAllReportingData, withDDI, defaultDirectory, limitSize, new FileSystemImpl()); mainProcessing.runMain(); } //Archive if(Boolean.TRUE.equals(archiveAtEnd)){ KraftwerkService kraftwerkService = new KraftwerkService(); - kraftwerkService.archive(inDirectory); + kraftwerkService.archive(inDirectory, new FileSystemImpl()); } System.exit(0); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java index 600459e6..133abdf4 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java @@ -7,6 +7,7 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.MetadataUtils; import fr.insee.kraftwerk.core.sequence.*; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.utils.log.KraftwerkExecutionLog; import fr.insee.kraftwerk.core.vtl.VtlBindings; @@ -45,6 +46,7 @@ public class MainProcessing { private KraftwerkExecutionLog kraftwerkExecutionLog; private List errors = new ArrayList<>(); private LocalDateTime executionDateTime; + private FileUtilsInterface fileUtilsInterface; /** * Map by mode @@ -54,7 +56,7 @@ public class MainProcessing { private final long limitSize; - public MainProcessing(String inDirectoryParam, boolean fileByFile,boolean withAllReportingData,boolean withDDI, String defaultDirectory, long limitSize) { + public MainProcessing(String inDirectoryParam, boolean fileByFile,boolean withAllReportingData,boolean withDDI, String defaultDirectory, long limitSize, FileUtilsInterface fileUtilsInterface) { super(); this.inDirectoryParam = inDirectoryParam; this.fileByFile = fileByFile; @@ -62,9 +64,10 @@ public MainProcessing(String inDirectoryParam, boolean fileByFile,boolean withAl this.withDDI=withDDI; this.limitSize = limitSize; controlInputSequence = new ControlInputSequence(defaultDirectory); + this.fileUtilsInterface = fileUtilsInterface; } - public MainProcessing(String inDirectoryParam, boolean fileByFile, String defaultDirectory, long limitSize) { + public MainProcessing(String inDirectoryParam, boolean fileByFile, String defaultDirectory, long limitSize, FileUtilsInterface fileUtilsInterface) { super(); this.inDirectoryParam = inDirectoryParam; this.fileByFile = fileByFile; @@ -72,6 +75,7 @@ public MainProcessing(String inDirectoryParam, boolean fileByFile, String defaul this.withDDI=true; this.limitSize = limitSize; controlInputSequence = new ControlInputSequence(defaultDirectory); + this.fileUtilsInterface = fileUtilsInterface; } @@ -104,7 +108,7 @@ public void init() throws KraftwerkException { String campaignName = inDirectory.getFileName().toString(); log.info("Kraftwerk main service started for campaign: " + campaignName); - userInputsFile = controlInputSequence.getUserInputs(inDirectory); + userInputsFile = controlInputSequence.getUserInputs(inDirectory, fileUtilsInterface); if (withDDI) metadataModels = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap()); if (!withDDI) metadataModels = MetadataUtils.getMetadataFromLunatic(userInputsFile.getModeInputsMap()); @@ -131,14 +135,14 @@ private void unimodalProcess() throws KraftwerkException { MetadataModel metadataForMode = metadataModels.get(dataMode); buildBindingsSequence.buildVtlBindings(userInputsFile, dataMode, vtlBindings, metadataForMode, withDDI, kraftwerkExecutionLog); UnimodalSequence unimodal = new UnimodalSequence(); - unimodal.applyUnimodalSequence(userInputsFile, dataMode, vtlBindings, errors, metadataModels); + unimodal.applyUnimodalSequence(userInputsFile, dataMode, vtlBindings, errors, metadataModels, fileUtilsInterface); } } /* Step 3 : multimodal VTL data processing */ private void multimodalProcess() { MultimodalSequence multimodalSequence = new MultimodalSequence(); - multimodalSequence.multimodalProcessing(userInputsFile, vtlBindings, errors, metadataModels); + multimodalSequence.multimodalProcessing(userInputsFile, vtlBindings, errors, metadataModels, fileUtilsInterface); } /* Step 4 : Write output files */ @@ -161,7 +165,7 @@ private static List getUserInputsFile(UserInputsFile source) thr for (String dataMode : source.getModeInputsMap().keySet()) { List dataFiles = getFilesToProcess(source, dataMode); for (Path dataFile : dataFiles) { - UserInputsFile currentFileInputs = new UserInputsFile(source.getUserInputFile(),source.getUserInputFile().getParent()); + UserInputsFile currentFileInputs = new UserInputsFile(source.getUserInputFile(),source.getUserInputFile().getParent(), source.getFileUtilsInterface()); currentFileInputs.setVtlReconciliationFile(source.getVtlReconciliationFile()); currentFileInputs.setVtlInformationLevelsFile(source.getVtlInformationLevelsFile()); currentFileInputs.setVtlTransformationsFile(source.getVtlTransformationsFile()); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java index 9f605154..a15c0702 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java @@ -15,6 +15,7 @@ import fr.insee.kraftwerk.core.sequence.MultimodalSequence; import fr.insee.kraftwerk.core.sequence.UnimodalSequence; import fr.insee.kraftwerk.core.sequence.WriterSequence; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.Getter; @@ -43,6 +44,7 @@ public class MainProcessingGenesis { @Getter private UserInputsGenesis userInputs; private LocalDateTime executionDateTime; + private FileUtilsInterface fileUtilsInterface; /* SPECIFIC VARIABLES */ @Getter @@ -55,8 +57,9 @@ public class MainProcessingGenesis { private GenesisClient client; - public MainProcessingGenesis(ConfigProperties config) { + public MainProcessingGenesis(ConfigProperties config, FileUtilsInterface fileUtilsInterface) { this.client = new GenesisClient(new RestTemplateBuilder(), config); + this.fileUtilsInterface = fileUtilsInterface; } public void init(String idCampaign) throws KraftwerkException, IOException { @@ -65,7 +68,7 @@ public void init(String idCampaign) throws KraftwerkException, IOException { inDirectory = controlInputSequenceGenesis.getInDirectory(idCampaign); //First we check the modes present in database for the given questionnaire //We build userInputs for the given questionnaire - userInputs = new UserInputsGenesis(controlInputSequenceGenesis.isHasConfigFile(), inDirectory, client.getModes(idCampaign)); + userInputs = new UserInputsGenesis(controlInputSequenceGenesis.isHasConfigFile(), inDirectory, client.getModes(idCampaign), fileUtilsInterface); if (!userInputs.getModes().isEmpty()) { metadataModels = MetadataUtilsGenesis.getMetadata(userInputs.getModeInputsMap()); } else { @@ -99,16 +102,16 @@ public void runMain(String idCampaign) throws KraftwerkException, IOException { private void unimodalProcess(List suLatest) throws NullException { BuildBindingsSequenceGenesis buildBindingsSequenceGenesis = new BuildBindingsSequenceGenesis(); for (String dataMode : userInputs.getModeInputsMap().keySet()) { - buildBindingsSequenceGenesis.buildVtlBindings(dataMode, vtlBindings, metadataModels, suLatest, inDirectory); + buildBindingsSequenceGenesis.buildVtlBindings(dataMode, vtlBindings, metadataModels, suLatest, inDirectory, fileUtilsInterface); UnimodalSequence unimodal = new UnimodalSequence(); - unimodal.applyUnimodalSequence(userInputs, dataMode, vtlBindings, errors, metadataModels); + unimodal.applyUnimodalSequence(userInputs, dataMode, vtlBindings, errors, metadataModels, fileUtilsInterface); } } /* Step 3 : multimodal VTL data processing */ private void multimodalProcess() { MultimodalSequence multimodalSequence = new MultimodalSequence(); - multimodalSequence.multimodalProcessing(userInputs, vtlBindings, errors, metadataModels); + multimodalSequence.multimodalProcessing(userInputs, vtlBindings, errors, metadataModels, fileUtilsInterface); } /* Step 4 : Write output files */ diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java index 796519d8..ec7126b0 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.sequence.ControlInputSequence; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import io.swagger.v3.oas.annotations.responses.ApiResponse; import io.swagger.v3.oas.annotations.responses.ApiResponses; import jakarta.annotation.PostConstruct; @@ -41,13 +41,15 @@ public class KraftwerkService { @PostConstruct public void initializeWithProperties() { + + if (StringUtils.isNotEmpty(csvOutputsQuoteChar)) { Constants.setCsvOutputQuoteChar(csvOutputsQuoteChar.trim().charAt(0)); } controlInputSequence = new ControlInputSequence(defaultDirectory); } - public ResponseEntity archive(String inDirectoryParam) { + public ResponseEntity archive(String inDirectoryParam, FileUtilsInterface fileUtilsInterface) { Path inDirectory; try { inDirectory = controlInputSequence.getInDirectory(inDirectoryParam); @@ -56,19 +58,19 @@ public ResponseEntity archive(String inDirectoryParam) { } /* Step 4.3 : move kraftwerk.json to a secondary folder */ - FileUtils.renameInputFile(inDirectory); + fileUtilsInterface.renameInputFile(inDirectory); /* Step 4.4 : move differential data to a secondary folder */ try { - FileUtils.archiveInputFiles(controlInputSequence.getUserInputs(inDirectory)); + fileUtilsInterface.archiveInputFiles(controlInputSequence.getUserInputs(inDirectory, fileUtilsInterface)); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } //delete temp directory - Path tempOutputPath = FileUtils.transformToTemp(inDirectory); + Path tempOutputPath = FileUtilsInterface.transformToTemp(inDirectory); try { - FileUtils.deleteDirectory(tempOutputPath); + fileUtilsInterface.deleteDirectory(tempOutputPath); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java index 07569e29..c8670742 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java @@ -6,6 +6,8 @@ import fr.insee.kraftwerk.api.process.MainProcessingGenesis; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.sequence.ControlInputSequenceGenesis; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.Parameter; import io.swagger.v3.oas.annotations.tags.Tag; @@ -40,7 +42,9 @@ public ResponseEntity mainService( ) { boolean fileByFile = false; boolean withDDI = true; - MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + + MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { mp.runMain(); } catch (KraftwerkException e) { @@ -48,7 +52,7 @@ public ResponseEntity mainService( } /* Step 4.3- 4.4 : Archive */ - if (Boolean.TRUE.equals(archiveAtEnd)) archive(inDirectoryParam); + if (Boolean.TRUE.equals(archiveAtEnd)) archive(inDirectoryParam,fileUtilsInterface); return ResponseEntity.ok(inDirectoryParam); } @@ -62,14 +66,16 @@ public ResponseEntity mainFileByFile( boolean fileByFile = true; boolean withAllReportingData = false; boolean withDDI = true; - MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + + MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { mp.runMain(); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } /* Step 4.3- 4.4 : Archive */ - if (Boolean.TRUE.equals(archiveAtEnd)) archive(inDirectoryParam); + if (Boolean.TRUE.equals(archiveAtEnd)) archive(inDirectoryParam, fileUtilsInterface); return ResponseEntity.ok(inDirectoryParam); } @@ -83,14 +89,16 @@ public ResponseEntity mainLunaticOnly( boolean withDDI = false; boolean fileByFile = false; boolean withAllReportingData = false; - MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + + MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { mp.runMain(); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } /* Step 4.3- 4.4 : Archive */ - if (Boolean.TRUE.equals(archiveAtEnd)) archive(inDirectoryParam); + if (Boolean.TRUE.equals(archiveAtEnd)) archive(inDirectoryParam, fileUtilsInterface); return ResponseEntity.ok(inDirectoryParam); } @@ -99,7 +107,9 @@ public ResponseEntity mainLunaticOnly( @Operation(operationId = "mainGenesis", summary = "${summary.mainGenesis}", description = "${description.mainGenesis}") public ResponseEntity mainGenesis( @Parameter(description = "${param.idCampaign}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String idCampaign) { - MainProcessingGenesis mpGenesis = new MainProcessingGenesis(configProperties); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + MainProcessingGenesis mpGenesis = new MainProcessingGenesis(configProperties, fileUtilsInterface); + try { mpGenesis.setControlInputSequenceGenesis(new ControlInputSequenceGenesis(defaultDirectory)); mpGenesis.runMain(idCampaign); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java index 8db35942..c3591a93 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java @@ -9,7 +9,8 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.MetadataUtils; import fr.insee.kraftwerk.core.sequence.*; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; import io.swagger.v3.oas.annotations.Operation; @@ -40,7 +41,9 @@ public ResponseEntity buildVtlBindings( //Read data files boolean fileByFile = false; boolean withDDI = true; - MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + + MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { mp.init(); } catch (KraftwerkException e) { @@ -77,7 +80,9 @@ public ResponseEntity buildVtlBindingsByDataMode( //Read data files boolean fileByFile = false; boolean withDDI = true; - MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + + MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { mp.init(); } catch (KraftwerkException e) { @@ -107,6 +112,8 @@ public ResponseEntity unimodalProcessing( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam, @Parameter(description = "${param.dataMode}", required = true) @RequestParam String dataMode ) { + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + //Read data in JSON file Path inDirectory; try { @@ -116,7 +123,7 @@ public ResponseEntity unimodalProcessing( } UserInputsFile userInputsFile; try { - userInputsFile = controlInputSequence.getUserInputs(inDirectory); + userInputsFile = controlInputSequence.getUserInputs(inDirectory, fileUtilsInterface); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } @@ -124,13 +131,13 @@ public ResponseEntity unimodalProcessing( List errors = new ArrayList<>(); VtlReaderWriterSequence vtlReaderSequence = new VtlReaderWriterSequence(); - vtlReaderSequence.readDataset(FileUtils.transformToTemp(inDirectory).toString(),dataMode, StepEnum.BUILD_BINDINGS, vtlBindings); + vtlReaderSequence.readDataset(FileUtilsInterface.transformToTemp(inDirectory).toString(),dataMode, StepEnum.BUILD_BINDINGS, vtlBindings); Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap()); //Process UnimodalSequence unimodal = new UnimodalSequence(); - unimodal.applyUnimodalSequence(userInputsFile, dataMode, vtlBindings, errors, metadataModelMap); + unimodal.applyUnimodalSequence(userInputsFile, dataMode, vtlBindings, errors, metadataModelMap, fileUtilsInterface); //Write technical outputs VtlReaderWriterSequence vtlWriterSequence = new VtlReaderWriterSequence(); @@ -148,6 +155,8 @@ public ResponseEntity unimodalProcessing( public ResponseEntity multimodalProcessing( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam ) { + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + //Read data in JSON file Path inDirectory; try { @@ -157,7 +166,7 @@ public ResponseEntity multimodalProcessing( } UserInputsFile userInputsFile; try { - userInputsFile = controlInputSequence.getUserInputs(inDirectory); + userInputsFile = controlInputSequence.getUserInputs(inDirectory, fileUtilsInterface); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } @@ -169,14 +178,14 @@ public ResponseEntity multimodalProcessing( //Test VtlBindings vtlBindings = new VtlBindings(); for (String dataMode : userInputsFile.getModeInputsMap().keySet()) { - vtlReaderWriterSequence.readDataset(FileUtils.transformToTemp(inDirectory).toString(),dataMode, StepEnum.UNIMODAL_PROCESSING, vtlBindings); + vtlReaderWriterSequence.readDataset(FileUtilsInterface.transformToTemp(inDirectory).toString(),dataMode, StepEnum.UNIMODAL_PROCESSING, vtlBindings); } Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap()); //Process MultimodalSequence multimodalSequence = new MultimodalSequence(); - multimodalSequence.multimodalProcessing(userInputsFile, vtlBindings, errors, metadataModelMap); + multimodalSequence.multimodalProcessing(userInputsFile, vtlBindings, errors, metadataModelMap, fileUtilsInterface); //Write technical fils for (String datasetName : vtlBindings.getDatasetNames()) { @@ -194,6 +203,8 @@ public ResponseEntity multimodalProcessing( public ResponseEntity writeOutputFiles( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam ) throws KraftwerkException { + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + Path inDirectory; try { inDirectory = controlInputSequence.getInDirectory(inDirectoryParam); @@ -204,8 +215,8 @@ public ResponseEntity writeOutputFiles( VtlBindings vtlBindings = new VtlBindings(); List errors = new ArrayList<>(); // Read all bindings necessary to produce output - String path = FileUtils.transformToTemp(inDirectory).toString(); - List fileNames = FileUtils.listFiles(path); + String path = FileUtilsInterface.transformToTemp(inDirectory).toString(); + List fileNames = fileUtilsInterface.listFiles(path); fileNames = fileNames.stream().filter(name -> name.endsWith(StepEnum.MULTIMODAL_PROCESSING.getStepLabel()+JSON)).toList(); for (String name : fileNames){ String pathBindings = path + File.separator + name; @@ -216,7 +227,7 @@ public ResponseEntity writeOutputFiles( WriterSequence writerSequence = new WriterSequence(); UserInputsFile userInputsFile; try { - userInputsFile = controlInputSequence.getUserInputs(inDirectory); + userInputsFile = controlInputSequence.getUserInputs(inDirectory, fileUtilsInterface); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } @@ -227,14 +238,13 @@ public ResponseEntity writeOutputFiles( } - @PutMapping(value = "/archive") @Operation(operationId = "archive", summary = "${summary.archive}", description = "${description.archive}") public ResponseEntity archiveService( - @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam) - { - return archive(inDirectoryParam); + @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam) { + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + return archive(inDirectoryParam, fileUtilsInterface); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java index 741f90ff..99fde59a 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java @@ -1,5 +1,6 @@ package fr.insee.kraftwerk.core.inputs; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import lombok.Getter; import lombok.Setter; @@ -17,9 +18,11 @@ public class UserInputs { protected Path vtlTransformationsFile; protected Path vtlInformationLevelsFile; protected String multimodeDatasetName; + protected FileUtilsInterface fileUtilsInterface; - public UserInputs(Path inputDirectory) { + public UserInputs(Path inputDirectory, FileUtilsInterface fileUtilsInterface) { this.inputDirectory = inputDirectory; + this.fileUtilsInterface = fileUtilsInterface; } public ModeInputs getModeInputs(String modeName) { return modeInputsMap.get(modeName); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java index 34c3a2fe..9a280407 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.exceptions.MissingMandatoryFieldException; import fr.insee.kraftwerk.core.exceptions.UnknownDataFormatException; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.JsonFileReader; import lombok.Getter; import lombok.Setter; @@ -28,8 +28,8 @@ public class UserInputsFile extends UserInputs { private final Set mandatoryFields = Set.of("survey_data", "data_mode", "data_file", "data_format", "multimode_dataset_name"); - public UserInputsFile(Path userConfigFile, Path inputDirectory) throws KraftwerkException { - super(inputDirectory); + public UserInputsFile(Path userConfigFile, Path inputDirectory, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { + super(inputDirectory,fileUtilsInterface); this.userInputFile = userConfigFile; readUserInputs(); } @@ -46,13 +46,13 @@ private void readUserInputs() throws UnknownDataFormatException, MissingMandator String dataFolder = readField(fileNode, "data_file"); String paradataFolder = readField(fileNode, "paradata_folder"); String reportingFolder = readField(fileNode, "reporting_data_file"); - Path dataPath = (new File(dataFolder).exists()) ? convertToUserPath(dataFolder) : FileUtils.convertToPath(dataFolder,inputDirectory); - URL ddiFile = FileUtils.convertToUrl(readField(fileNode, "DDI_file"),inputDirectory); - Path lunaticFile = FileUtils.convertToPath(readField(fileNode, "lunatic_file"),inputDirectory); + Path dataPath = (new File(dataFolder).exists()) ? convertToUserPath(dataFolder) : fileUtilsInterface.convertToPath(dataFolder,inputDirectory); + URL ddiFile = fileUtilsInterface.convertToUrl(readField(fileNode, "DDI_file"),inputDirectory); + Path lunaticFile = fileUtilsInterface.convertToPath(readField(fileNode, "lunatic_file"),inputDirectory); String dataFormat = readField(fileNode, "data_format"); - Path paradataPath = (paradataFolder != null && new File(paradataFolder).exists()) ? convertToUserPath(paradataFolder) : FileUtils.convertToPath(paradataFolder,inputDirectory); - Path reportingDataFile = (reportingFolder != null && new File(reportingFolder).exists()) ? convertToUserPath(reportingFolder) : FileUtils.convertToPath(reportingFolder,inputDirectory); - Path vtlFile = FileUtils.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); + Path paradataPath = (paradataFolder != null && new File(paradataFolder).exists()) ? convertToUserPath(paradataFolder) : fileUtilsInterface.convertToPath(paradataFolder,inputDirectory); + Path reportingDataFile = (reportingFolder != null && new File(reportingFolder).exists()) ? convertToUserPath(reportingFolder) : fileUtilsInterface.convertToPath(reportingFolder,inputDirectory); + Path vtlFile = fileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); ModeInputs modeInputs = new ModeInputs(); modeInputs.setDataFile(dataPath); modeInputs.setDdiUrl(ddiFile); @@ -65,9 +65,9 @@ private void readUserInputs() throws UnknownDataFormatException, MissingMandator } // multimodeDatasetName = readField(userInputs, "multimode_dataset_name"); - vtlReconciliationFile = FileUtils.convertToPath(readField(userInputs, "reconciliation_specifications"),inputDirectory); - vtlTransformationsFile = FileUtils.convertToPath(readField(userInputs, "transformation_specifications"),inputDirectory); - vtlInformationLevelsFile = FileUtils.convertToPath(readField(userInputs, "information_levels_specifications"),inputDirectory); + vtlReconciliationFile = fileUtilsInterface.convertToPath(readField(userInputs, "reconciliation_specifications"),inputDirectory); + vtlTransformationsFile = fileUtilsInterface.convertToPath(readField(userInputs, "transformation_specifications"),inputDirectory); + vtlInformationLevelsFile = fileUtilsInterface.convertToPath(readField(userInputs, "information_levels_specifications"),inputDirectory); } catch (IOException e) { log.error("Unable to read user input file: {} , {}", userInputFile, e); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java index f62a5125..81048103 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java @@ -6,7 +6,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.exceptions.MissingMandatoryFieldException; import fr.insee.kraftwerk.core.exceptions.UnknownDataFormatException; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.JsonFileReader; import lombok.extern.log4j.Log4j2; @@ -24,8 +24,8 @@ public class UserInputsGenesis extends UserInputs{ private final List modes; - public UserInputsGenesis(boolean hasConfigFile, Path inputDirectory, List modes) throws KraftwerkException, IOException { - super(inputDirectory); + public UserInputsGenesis(boolean hasConfigFile, Path inputDirectory, List modes, FileUtilsInterface fileUtilsInterface) throws KraftwerkException, IOException { + super(inputDirectory, fileUtilsInterface); this.hasConfigFile = hasConfigFile; this.modes=modes; computeInputs(); @@ -34,7 +34,7 @@ public UserInputsGenesis(boolean hasConfigFile, Path inputDirectory, List private void computeInputs() throws KraftwerkException, IOException { UserInputsFile userInputsFile; if(hasConfigFile){ - userInputsFile = new UserInputsFile(inputDirectory.resolve(Constants.USER_INPUT_FILE), inputDirectory); + userInputsFile = new UserInputsFile(inputDirectory.resolve(Constants.USER_INPUT_FILE), inputDirectory, fileUtilsInterface); modeInputsMap = userInputsFile.getModeInputsMap(); }else{ for (Mode mode : modes) { @@ -75,7 +75,7 @@ private Path getModeVtlFile(Mode mode) throws UnknownDataFormatException, Missin String dataMode = readField(fileNode, "data_mode"); if (dataMode == null) {break;} if (dataMode.equals(mode.name())) { - return FileUtils.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); + return fileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); } } } catch (IOException e) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java index 093cd170..a5f52b31 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.metadata.MetadataModel; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.Getter; @@ -40,7 +40,7 @@ protected OutputFiles(Path outDirectory, VtlBindings vtlBindings, List m /** Create output folder if doesn't exist. */ private void createOutputFolder() { - FileUtils.createDirectoryIfNotExist(outputFolder); + FileSystemImpl.createDirectoryIfNotExist(outputFolder); } /** See getOutputDatasetNames doc. */ diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java index 97e63c73..e39b0354 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java @@ -15,7 +15,7 @@ import fr.insee.kraftwerk.core.rawdata.GroupInstance; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; @@ -32,7 +32,7 @@ public BuildBindingsSequenceGenesis() { vtlExecute = new VtlExecute(); } - public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map metadataModels, List surveyUnits, Path inDirectory) throws NullException { + public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map metadataModels, List surveyUnits, Path inDirectory, FileUtilsInterface fileUtilsInterface) throws NullException { SurveyRawData data = new SurveyRawData(); /* Step 2.0 : Read the DDI file (and Lunatic Json for missing variables) to get survey variables */ @@ -72,7 +72,7 @@ public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map listFiles = FileUtils.listFiles(reportingDataFile.toString()); + List listFiles = fileUtilsInterface.listFiles(reportingDataFile.toString()); for (String file : listFiles) { ReportingData reportingData = new ReportingData(reportingDataFile.resolve(file)); if (file.contains(".xml")) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java index df381158..d83af81e 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java @@ -7,6 +7,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.UserInputsFile; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import lombok.extern.log4j.Log4j2; @Log4j2 @@ -19,8 +20,8 @@ public ControlInputSequence(String defaultDirectory) { this.defaultDirectory = defaultDirectory; } - public UserInputsFile getUserInputs(Path inDirectory) throws KraftwerkException { - return new UserInputsFile(inDirectory.resolve(Constants.USER_INPUT_FILE), inDirectory); + public UserInputsFile getUserInputs(Path inDirectory, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { + return new UserInputsFile(inDirectory.resolve(Constants.USER_INPUT_FILE), inDirectory, fileUtilsInterface); } public Path getInDirectory(String inDirectoryParam) throws KraftwerkException { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java index 46c77555..4bca68c9 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java @@ -12,7 +12,7 @@ import fr.insee.kraftwerk.core.dataprocessing.ReconciliationProcessing; import fr.insee.kraftwerk.core.inputs.UserInputs; import fr.insee.kraftwerk.core.metadata.MetadataModel; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.NoArgsConstructor; @@ -20,31 +20,31 @@ @NoArgsConstructor public class MultimodalSequence { - public void multimodalProcessing(UserInputs userInputs, VtlBindings vtlBindings, List errors, Map metadataModels) { + public void multimodalProcessing(UserInputs userInputs, VtlBindings vtlBindings, List errors, Map metadataModels, FileUtilsInterface fileUtilsInterface) { String multimodeDatasetName = Constants.MULTIMODE_DATASET_NAME; /* Step 3.1 : aggregate unimodal datasets into a multimodal unique dataset */ DataProcessing reconciliationProcessing = new ReconciliationProcessing(vtlBindings); String vtlGenerate = reconciliationProcessing.applyVtlTransformations(multimodeDatasetName, userInputs.getVtlReconciliationFile(), errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "ReconciliationProcessing",multimodeDatasetName), vtlGenerate); + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "ReconciliationProcessing",multimodeDatasetName), vtlGenerate); /* Step 3.1.b : clean up processing */ CleanUpProcessing cleanUpProcessing = new CleanUpProcessing(vtlBindings, metadataModels); vtlGenerate = cleanUpProcessing.applyVtlTransformations(multimodeDatasetName, null, errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "CleanUpProcessing",multimodeDatasetName), vtlGenerate); + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "CleanUpProcessing",multimodeDatasetName), vtlGenerate); /* Step 3.2 : treatments on the multimodal dataset */ DataProcessing multimodeTransformations = new MultimodeTransformations(vtlBindings); vtlGenerate = multimodeTransformations.applyVtlTransformations(multimodeDatasetName, userInputs.getVtlTransformationsFile(), errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "MultimodeTransformations",multimodeDatasetName), vtlGenerate); + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "MultimodeTransformations",multimodeDatasetName), vtlGenerate); /* Step 3.3 : create datasets on each information level (i.e. each group) */ DataProcessing informationLevelsProcessing = new InformationLevelsProcessing(vtlBindings); vtlGenerate = informationLevelsProcessing.applyVtlTransformations(multimodeDatasetName, userInputs.getVtlInformationLevelsFile(), errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "InformationLevelsProcessing",multimodeDatasetName), vtlGenerate); + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "InformationLevelsProcessing",multimodeDatasetName), vtlGenerate); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java index d7263549..0dbc6f98 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java @@ -6,7 +6,7 @@ import fr.insee.kraftwerk.core.inputs.ModeInputs; import fr.insee.kraftwerk.core.inputs.UserInputs; import fr.insee.kraftwerk.core.metadata.*; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.NoArgsConstructor; @@ -21,7 +21,7 @@ public class UnimodalSequence { public void applyUnimodalSequence(UserInputs userInputs, String dataMode, VtlBindings vtlBindings, - List errors, Map metadataModels) { + List errors, Map metadataModels, FileUtilsInterface fileUtilsInterface) { ModeInputs modeInputs = userInputs.getModeInputs(dataMode); String vtlGenerate; @@ -44,7 +44,7 @@ public void applyUnimodalSequence(UserInputs userInputs, String dataMode, VtlBin .getCalculatedFromLunatic(modeInputs.getLunaticFile()); CalculatedProcessing calculatedProcessing = new CalculatedProcessing(vtlBindings, calculatedVariables); vtlGenerate = calculatedProcessing.applyCalculatedVtlTransformations(dataMode, modeInputs.getModeVtlFile(), errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "CalculatedProcessing", dataMode), + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "CalculatedProcessing", dataMode), vtlGenerate); } else { @@ -53,7 +53,7 @@ public void applyUnimodalSequence(UserInputs userInputs, String dataMode, VtlBin /* Step 2.4c : Prefix variable names with their belonging group names */ vtlGenerate = new GroupProcessing(vtlBindings, metadataModels.get(dataMode)).applyVtlTransformations(dataMode, null, errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "GroupProcessing", dataMode), vtlGenerate); + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "GroupProcessing", dataMode), vtlGenerate); /* Step 2.5 : Apply standard mode-specific VTL transformations */ UnimodalDataProcessing dataProcessing = DataProcessingManager.getProcessingClass(modeInputs.getDataFormat(), @@ -64,16 +64,16 @@ public void applyUnimodalSequence(UserInputs userInputs, String dataMode, VtlBin .resolve("unimode") .resolve(dataMode+".vtl"), errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "StandardVtl", dataMode), vtlGenerate); + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "StandardVtl", dataMode), vtlGenerate); /* Step 2.5b : Apply TCM VTL transformations */ TCMSequencesProcessing tcmSequencesProcessing = new TCMSequencesProcessing(vtlBindings,metadataModels.get(dataMode) , Constants.VTL_FOLDER_PATH); vtlGenerate = tcmSequencesProcessing.applyAutomatedVtlInstructions(dataMode, errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, "TCMSequenceVTL", dataMode), vtlGenerate); + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "TCMSequenceVTL", dataMode), vtlGenerate); /* Step 2.5c : Apply user specified mode-specific VTL transformations */ vtlGenerate = dataProcessing.applyVtlTransformations(dataMode, modeInputs.getModeVtlFile(), errors); - TextFileWriter.writeFile(FileUtils.getTempVtlFilePath(userInputs, dataProcessing.getStepName(), dataMode), + TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, dataProcessing.getStepName(), dataMode), vtlGenerate); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java index 7356e6f5..9263217c 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java @@ -4,7 +4,7 @@ import java.nio.file.Path; import fr.insee.kraftwerk.core.dataprocessing.StepEnum; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; @@ -29,7 +29,7 @@ public void readDataset(String pathBindings,String bindingName,VtlBindings vtlBi } public void writeTempBindings(Path inDirectory, String dataMode, VtlBindings vtlBindings, StepEnum step) { - Path tempOutputPath = FileUtils.transformToTemp(inDirectory).resolve(dataMode+"_"+step.getStepLabel()+JSON); + Path tempOutputPath = FileUtilsInterface.transformToTemp(inDirectory).resolve(dataMode+"_"+step.getStepLabel()+JSON); vtlExecute.writeJsonDataset(dataMode, tempOutputPath, vtlBindings); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java index fc2b8a86..f73a4290 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java @@ -7,7 +7,7 @@ import fr.insee.kraftwerk.core.outputs.OutputFiles; import fr.insee.kraftwerk.core.outputs.csv.CsvOutputFiles; import fr.insee.kraftwerk.core.outputs.parquet.ParquetOutputFiles; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.log.KraftwerkExecutionLog; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.NoArgsConstructor; @@ -26,7 +26,7 @@ public void writeOutputFiles(Path inDirectory,LocalDateTime executionDateTime, V } public void writeOutputFiles(Path inDirectory, LocalDateTime localDateTime, VtlBindings vtlBindings, Map modeInputsMap, Map metadataModels, List errors, KraftwerkExecutionLog kraftwerkExecutionLog) throws KraftwerkException { - Path outDirectory = FileUtils.transformToOut(inDirectory,localDateTime); + Path outDirectory = FileUtilsInterface.transformToOut(inDirectory,localDateTime); /* Step 4.1 : write csv output tables */ OutputFiles csvOutputFiles = new CsvOutputFiles(outDirectory, vtlBindings, new ArrayList<>(modeInputsMap.keySet()),kraftwerkExecutionLog); csvOutputFiles.writeOutputTables(metadataModels); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtils.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileSystemImpl.java similarity index 70% rename from kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtils.java rename to kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileSystemImpl.java index 6b83ea3e..49d9e416 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtils.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileSystemImpl.java @@ -1,12 +1,11 @@ package fr.insee.kraftwerk.core.utils; -import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.ModeInputs; import fr.insee.kraftwerk.core.inputs.UserInputs; import fr.insee.kraftwerk.core.inputs.UserInputsFile; +import lombok.NoArgsConstructor; import lombok.extern.log4j.Log4j2; -import org.springframework.util.FileSystemUtils; import java.io.File; import java.io.IOException; @@ -16,53 +15,23 @@ import java.net.URL; import java.nio.file.Files; import java.nio.file.Path; -import java.time.LocalDateTime; -import java.time.format.DateTimeFormatter; import java.util.Arrays; import java.util.List; import java.util.regex.Pattern; import java.util.stream.Stream; @Log4j2 -public class FileUtils { - - private FileUtils(){ - throw new IllegalStateException("Utility class"); - } +@NoArgsConstructor +public class FileSystemImpl implements FileUtilsInterface{ private static final String ARCHIVE = "Archive"; - /** - * Change /some/path/in/campaign-name to /some/path/out/campaign-name - */ - public static Path transformToOut(Path inDirectory) { - return transformToOther(inDirectory, "out"); - } - public static Path transformToOut(Path inDirectory, LocalDateTime localDateTime) { - return transformToOther(inDirectory, "out").resolve(localDateTime.format(DateTimeFormatter.ofPattern(Constants.OUTPUT_FOLDER_DATETIME_PATTERN))); - } - - /** - * Change /some/path/in/campaign-name to /some/path/temp/campaign-name - */ - public static Path transformToTemp(Path inDirectory) { - return transformToOther(inDirectory, "temp"); - } - - /** - * Change /some/path/in/campaign-name to /some/path/__other__/campaign-name - */ - private static Path transformToOther(Path inDirectory, String other) { - return "in".equals(inDirectory.getFileName().toString()) ? inDirectory.getParent().resolve(other) - : transformToOther(inDirectory.getParent(),other).resolve(inDirectory.getFileName()); - } - /** * Move the input file to another directory to archive it */ - public static void renameInputFile(Path inDirectory) { + public void renameInputFile(Path inDirectory) { File file = inDirectory.resolve("kraftwerk.json").toFile(); String fileWithTime = "kraftwerk-" + DateUtils.getCurrentTimeStamp() + ".json"; @@ -81,7 +50,7 @@ public static void renameInputFile(Path inDirectory) { } } - public static void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException { + public void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException { // Path inputFolder = userInputsFile.getInputDirectory(); String[] directories = inputFolder.toString().split(Pattern.quote(File.separator)); @@ -105,7 +74,7 @@ public static void archiveInputFiles(UserInputsFile userInputsFile) throws Kraft * @param modeInputs * @throws KraftwerkException */ - private static void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs) + private void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs) throws KraftwerkException { if (modeInputs.getReportingDataFile() != null) { moveDirectory(modeInputs.getReportingDataFile().toFile(), inputFolder.resolve(ARCHIVE) @@ -120,7 +89,7 @@ private static void archiveReportingData(Path inputFolder, String campaignName, * @param modeInputs * @throws KraftwerkException */ - private static void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs) + private void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs) throws KraftwerkException { if (modeInputs.getParadataFolder() != null) { moveDirectory(modeInputs.getParadataFolder().toFile(), inputFolder.resolve(ARCHIVE) @@ -128,7 +97,7 @@ private static void archiveParadata(Path inputFolder, String campaignName, ModeI } } - private static void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) + private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) throws KraftwerkException { Path dataPath = modeInputs.getDataFile(); Path newDataPath = inputFolder.resolve(ARCHIVE).resolve(getRoot(dataPath, campaignName)); @@ -145,13 +114,13 @@ private static void archiveData(Path inputFolder, String campaignName, ModeInput } } - private static void createArchiveDirectoryIfNotExists(Path inputFolder) { + private void createArchiveDirectoryIfNotExists(Path inputFolder) { if (!Files.exists(inputFolder.resolve(ARCHIVE))) { inputFolder.resolve(ARCHIVE).toFile().mkdir(); } } - private static void moveFile(Path dataPath, Path newDataPath) throws KraftwerkException { + private void moveFile(Path dataPath, Path newDataPath) throws KraftwerkException { try { Files.move(dataPath, newDataPath); } catch (IOException e) { @@ -160,7 +129,7 @@ private static void moveFile(Path dataPath, Path newDataPath) throws KraftwerkEx } - private static void moveDirectory(File sourceFile, File destFile) throws KraftwerkException { + private void moveDirectory(File sourceFile, File destFile) throws KraftwerkException { if (sourceFile.isDirectory()) { File[] files = sourceFile.listFiles(); assert files != null : "List of files in sourceFile is null"; @@ -179,7 +148,7 @@ private static void moveDirectory(File sourceFile, File destFile) throws Kraftwe } } - private static String getRoot(Path path, String campaignName) { + private String getRoot(Path path, String campaignName) { String[] directories = path.toString().split(Pattern.quote(File.separator)); int campaignIndex = Arrays.asList(directories).indexOf(campaignName); String[] newDirectories = Arrays.copyOfRange(directories, campaignIndex + 1, directories.length); @@ -193,9 +162,9 @@ private static String getRoot(Path path, String campaignName) { } - public static void deleteDirectory(Path directoryPath) throws KraftwerkException { + public void deleteDirectory(Path directoryPath) throws KraftwerkException { try { - FileSystemUtils.deleteRecursively(directoryPath); + org.springframework.util.FileSystemUtils.deleteRecursively(directoryPath); } catch (IOException e) { throw new KraftwerkException(500, "IOException when deleting temp folder : "+e.getMessage()); } @@ -206,16 +175,16 @@ public static void deleteDirectory(Path directoryPath) throws KraftwerkException * @param dir * @return */ - public static List listFiles(String dir) { + public List listFiles(String dir) { return Stream.of(new File(dir).listFiles()) .filter(file -> !file.isDirectory()) .map(File::getName) .toList(); } - public static Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset) { - createDirectoryIfNotExist(FileUtils.transformToTemp(userInputs.getInputDirectory())); - return FileUtils.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); + public Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset) { + createDirectoryIfNotExist(FileUtilsInterface.transformToTemp(userInputs.getInputDirectory())); + return FileUtilsInterface.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); } public static void createDirectoryIfNotExist(Path path) { @@ -227,7 +196,7 @@ public static void createDirectoryIfNotExist(Path path) { } } - public static Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { + public Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { Path inputPath = inputDirectory.resolve(userField); if (!new File(inputPath.toUri()).exists()) { @@ -239,7 +208,7 @@ public static Path convertToPath(String userField, Path inputDirectory) throws K } } - public static URL convertToUrl(String userField, Path inputDirectory) { + public URL convertToUrl(String userField, Path inputDirectory) { if (userField == null) { log.debug("null value out of method that reads DDI field (should not happen)."); return null; @@ -254,5 +223,4 @@ public static URL convertToUrl(String userField, Path inputDirectory) { return null; } } - } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtilsInterface.java new file mode 100644 index 00000000..2b221d53 --- /dev/null +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtilsInterface.java @@ -0,0 +1,51 @@ +package fr.insee.kraftwerk.core.utils; + +import fr.insee.kraftwerk.core.Constants; +import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.inputs.UserInputs; +import fr.insee.kraftwerk.core.inputs.UserInputsFile; + +import java.net.URL; +import java.nio.file.Path; +import java.time.LocalDateTime; +import java.time.format.DateTimeFormatter; +import java.util.List; + +public interface FileUtilsInterface { + static Path transformToOut(Path inDirectory) { + return transformToOther(inDirectory, "out"); + } + + static Path transformToOut(Path inDirectory, LocalDateTime localDateTime) { + return transformToOther(inDirectory, "out").resolve(localDateTime.format(DateTimeFormatter.ofPattern(Constants.OUTPUT_FOLDER_DATETIME_PATTERN))); + } + + /** + * Change /some/path/in/campaign-name to /some/path/temp/campaign-name + */ + static Path transformToTemp(Path inDirectory) { + return transformToOther(inDirectory, "temp"); + } + + /** + * Change /some/path/in/campaign-name to /some/path/__other__/campaign-name + */ + private static Path transformToOther(Path inDirectory, String other) { + return "in".equals(inDirectory.getFileName().toString()) ? inDirectory.getParent().resolve(other) + : transformToOther(inDirectory.getParent(), other).resolve(inDirectory.getFileName()); + } + + void renameInputFile(Path inDirectory); + + void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException; + + void deleteDirectory(Path directoryPath) throws KraftwerkException; + + List listFiles(String dir); + + Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset); + + Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; + + URL convertToUrl(String userField, Path inputDirectory); +} diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java index 22b1073d..5fbfa75c 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java @@ -37,9 +37,9 @@ public static void writeFile(Path filePath, String fileContent){ } public static void writeErrorsFile(Path inDirectory, LocalDateTime localDateTime, List errors) { - Path tempOutputPath = FileUtils.transformToOut(inDirectory,localDateTime) + Path tempOutputPath = FileUtilsInterface.transformToOut(inDirectory,localDateTime) .resolve(Constants.ERRORS_FILE_NAME); - FileUtils.createDirectoryIfNotExist(tempOutputPath.getParent()); + FileSystemImpl.createDirectoryIfNotExist(tempOutputPath.getParent()); //Write errors file if (!errors.isEmpty()) { @@ -57,9 +57,9 @@ public static void writeErrorsFile(Path inDirectory, LocalDateTime localDateTime } public static void writeLogFile(Path inDirectory, LocalDateTime localDateTime, KraftwerkExecutionLog kraftwerkExecutionLog){ - Path tempOutputPath = FileUtils.transformToOut(inDirectory,localDateTime); + Path tempOutputPath = FileUtilsInterface.transformToOut(inDirectory,localDateTime); tempOutputPath = tempOutputPath.resolve(inDirectory.getFileName() + "_LOG_" + kraftwerkExecutionLog.getStartTimeStamp() +".txt"); - FileUtils.createDirectoryIfNotExist(tempOutputPath.getParent()); + FileSystemImpl.createDirectoryIfNotExist(tempOutputPath.getParent()); try (FileWriter myWriter = new FileWriter(tempOutputPath.toFile(),true)){ myWriter.write(kraftwerkExecutionLog.getFormattedString()); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java index deea20d9..e5f4ff56 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java @@ -22,7 +22,7 @@ private XMLSplitter() { public static void split(String inputfolder, String xmlfile, String outputFolder, String condition, int nbElementsByFile) throws XMLStreamException, IOException { - FileUtils.createDirectoryIfNotExist(Paths.get(outputFolder)); + FileSystemImpl.createDirectoryIfNotExist(Paths.get(outputFolder)); String xmlResource = inputfolder + xmlfile; List header = getHeader(xmlResource, condition); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java index 51b540d5..64fa9ae0 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java @@ -5,7 +5,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.vtl.jackson.TrevasModule; import fr.insee.vtl.model.Dataset; @@ -118,7 +118,7 @@ public void putVtlDataset(String filePath, String bindingName, VtlBindings bindi * @param jsonOutFile Path to write the output json file. * */ public void writeJsonDataset(String bindingName, Path jsonOutFile, VtlBindings bindings) { - FileUtils.createDirectoryIfNotExist(jsonOutFile.getParent()); + FileSystemImpl.createDirectoryIfNotExist(jsonOutFile.getParent()); //Write file if (bindings.containsKey(bindingName)) { diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java index 5eb1dc44..7e94738e 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java @@ -10,6 +10,8 @@ import java.nio.file.Path; import java.util.Set; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import org.junit.jupiter.api.Test; import fr.insee.kraftwerk.core.TestConstants; @@ -21,12 +23,14 @@ class UserInputsFileTest { private static final Path inputSamplesDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "user_inputs"); + private static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @Test void testReadValidUserInput_singleMode() throws KraftwerkException { UserInputsFile userInputsFile = new UserInputsFile( inputSamplesDirectory.resolve("inputs_valid.json"), - inputSamplesDirectory); + inputSamplesDirectory, fileUtilsInterface); // ModeInputs modeInputs = userInputsFile.getModeInputs("CAPI"); assertNotNull(modeInputs.getDataFile()); @@ -46,14 +50,14 @@ void testReadValidUserInput_singleMode() throws KraftwerkException { void testReadValidUserInput_missingOptionalFields() { assertDoesNotThrow(() -> new UserInputsFile( inputSamplesDirectory.resolve("inputs_valid_missing_fields.json"), - inputSamplesDirectory)); + inputSamplesDirectory, fileUtilsInterface)); } @Test void testReadValidUserInput_severalModes() throws KraftwerkException { UserInputsFile userInputsFile = new UserInputsFile( inputSamplesDirectory.resolve("inputs_valid_several_modes.json"), - inputSamplesDirectory); + inputSamplesDirectory, fileUtilsInterface); // assertTrue(userInputsFile.getModes().containsAll(Set.of("CAPI", "CAWI", "PAPI"))); // @@ -75,7 +79,7 @@ void testReadValidUserInput_severalModes() throws KraftwerkException { void testReadInvalidUserInput_wrongDataFormat() { Path path = inputSamplesDirectory.resolve("inputs_invalid_data_format.json"); assertThrows(UnknownDataFormatException.class, () -> { - new UserInputsFile(path,inputSamplesDirectory); + new UserInputsFile(path,inputSamplesDirectory, fileUtilsInterface); }); } @@ -83,7 +87,7 @@ void testReadInvalidUserInput_wrongDataFormat() { void testReadInvalidUserInput_wrongFieldNames() { Path path = inputSamplesDirectory.resolve("inputs_invalid_field_names.json"); assertThrows(MissingMandatoryFieldException.class, () -> { - new UserInputsFile( path,inputSamplesDirectory); + new UserInputsFile( path,inputSamplesDirectory, fileUtilsInterface); }); } @@ -91,7 +95,7 @@ void testReadInvalidUserInput_wrongFieldNames() { void testReadMalformedInput() throws KraftwerkException { Path path = inputSamplesDirectory.resolve("inputs_invalid_malformed.json"); assertThrows(UnknownDataFormatException.class, () -> { - new UserInputsFile(path,inputSamplesDirectory); + new UserInputsFile(path,inputSamplesDirectory, fileUtilsInterface); }); } @@ -99,7 +103,7 @@ void testReadMalformedInput() throws KraftwerkException { void testReadInputMissingFile() throws KraftwerkException { Path path = inputSamplesDirectory.resolve("inputs_invalid_several_modes_fileNotExist.json"); assertThrows(KraftwerkException.class, () -> { - new UserInputsFile(path,inputSamplesDirectory); + new UserInputsFile(path,inputSamplesDirectory, fileUtilsInterface); }); } @@ -107,7 +111,7 @@ void testReadInputMissingFile() throws KraftwerkException { void testReadInputCompletePath() throws KraftwerkException { Path path = inputSamplesDirectory.resolve("inputs_valid_several_modes_completePath.json"); assertDoesNotThrow(() -> { - new UserInputsFile(path,inputSamplesDirectory); + new UserInputsFile(path,inputSamplesDirectory, fileUtilsInterface); }); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java index 1b77e367..2673c45e 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java @@ -4,6 +4,7 @@ import fr.insee.kraftwerk.core.data.model.Mode; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.parsers.DataFormat; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; import org.junit.jupiter.api.Test; import java.io.IOException; @@ -22,7 +23,7 @@ void testReadValidUserInput_singleMode() throws KraftwerkException, IOException List modes = new ArrayList<>(); modes.add(Mode.F2F); - UserInputsGenesis userInputsGenesis = new UserInputsGenesis(false, inputSamplesDirectory.resolve("Valid"), modes); + UserInputsGenesis userInputsGenesis = new UserInputsGenesis(false, inputSamplesDirectory.resolve("Valid"), modes, new FileSystemImpl()); // ModeInputs modeInputs = userInputsGenesis.getModeInputs("F2F"); assertNotNull(modeInputs.getDdiUrl()); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java index 06d7c189..c5b8c606 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java @@ -10,6 +10,8 @@ import java.util.List; import java.util.Set; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import org.junit.jupiter.api.MethodOrderer.OrderAnnotation; import org.junit.jupiter.api.Order; import org.junit.jupiter.api.Test; @@ -30,6 +32,8 @@ class CsvOutputFilesTest { private static UserInputsFile testUserInputsFile; private static OutputFiles outputFiles; + private static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + Dataset fooDataset = new InMemoryDataset(List.of(), List.of(new Structured.Component("FOO", String.class, Dataset.Role.IDENTIFIER))); @@ -40,7 +44,7 @@ void createInstance() { // testUserInputsFile = new UserInputsFile( Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "user_inputs/inputs_valid_several_modes.json"), - Path.of(TestConstants.UNIT_TESTS_DIRECTORY,"user_inputs")); + Path.of(TestConstants.UNIT_TESTS_DIRECTORY,"user_inputs"), fileUtilsInterface); // VtlBindings vtlBindings = new VtlBindings(); for (String mode : testUserInputsFile.getModes()) { diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java index 2e41c629..de40c28b 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java @@ -9,7 +9,7 @@ import fr.insee.kraftwerk.core.metadata.VariableType; import fr.insee.kraftwerk.core.outputs.csv.CsvTableWriter; import fr.insee.kraftwerk.core.utils.CsvUtils; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; import fr.insee.vtl.model.InMemoryDataset; @@ -64,7 +64,7 @@ class CsvTableWriterTest { void writeCsvFromDatasetTest() throws IOException, CsvException { // Clean the existing file Files.deleteIfExists(outTestFilePath); - FileUtils.createDirectoryIfNotExist(outTestFilePath.getParent()); + FileSystemImpl.createDirectoryIfNotExist(outTestFilePath.getParent()); Map metaModels = new HashMap<>(); MetadataModel metadataModel = new MetadataModel(); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java index 43798f8c..e807a8c7 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java @@ -1,6 +1,5 @@ package fr.insee.kraftwerk.core.outputs; -import com.opencsv.exceptions.CsvException; import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.inputs.UserInputsFile; @@ -9,7 +8,8 @@ import fr.insee.kraftwerk.core.metadata.Variable; import fr.insee.kraftwerk.core.metadata.VariableType; import fr.insee.kraftwerk.core.outputs.parquet.ParquetOutputFiles; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; @@ -22,7 +22,6 @@ import org.junit.jupiter.api.TestMethodOrder; import java.io.File; -import java.io.IOException; import java.nio.file.Path; import java.nio.file.Paths; import java.util.HashMap; @@ -38,6 +37,7 @@ class ParquetOutputFilesTest { private static UserInputsFile testUserInputs; private static ParquetOutputFiles outputFiles; + private static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); Dataset testDataset = new InMemoryDataset( @@ -61,7 +61,7 @@ void createInstance() { // testUserInputs = new UserInputsFile( Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "user_inputs/inputs_valid_several_modes.json"), - Path.of(TestConstants.UNIT_TESTS_DIRECTORY,"user_inputs")); + Path.of(TestConstants.UNIT_TESTS_DIRECTORY,"user_inputs"), fileUtilsInterface); // VtlBindings vtlBindings = new VtlBindings(); for (String mode : testUserInputs.getModes()) { @@ -93,11 +93,11 @@ void testGetDatasetOutputNames() { @Test @Order(3) - void writeParquetFromDatasetTest() throws IOException, CsvException { + void writeParquetFromDatasetTest(){ // Clean the existing file // Files.deleteIfExists(outputFiles.getOutputFolder()); - FileUtils.createDirectoryIfNotExist(outputFiles.getOutputFolder()); + FileSystemImpl.createDirectoryIfNotExist(outputFiles.getOutputFolder()); Map metaModels = new HashMap<>(); MetadataModel metMod = new MetadataModel(); @@ -116,20 +116,4 @@ void writeParquetFromDatasetTest() throws IOException, CsvException { Assertions.assertNotEquals(0, f.length()); } - - - - - - - - boolean deleteDirectory(File directoryToBeDeleted) { - File[] allContents = directoryToBeDeleted.listFiles(); - if (allContents != null) { - for (File file : allContents) { - deleteDirectory(file); - } - } - return directoryToBeDeleted.delete(); - } } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java index d954e29d..cb1d3999 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java @@ -7,6 +7,8 @@ import fr.insee.kraftwerk.core.metadata.UcqVariable; import fr.insee.kraftwerk.core.metadata.Variable; import fr.insee.kraftwerk.core.metadata.VariableType; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import org.junit.jupiter.api.Test; import org.junit.jupiter.params.ParameterizedTest; @@ -20,6 +22,8 @@ class BuildBindingsSequenceTest { private static final Path inputSamplesDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "user_inputs"); + private static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @Test @@ -27,7 +31,7 @@ void buildVtlBindings_errorWithoutMetadata() throws KraftwerkException { //GIVEN UserInputsFile userInputsFile = new UserInputsFile( inputSamplesDirectory.resolve("inputs_valid.json"), - inputSamplesDirectory); + inputSamplesDirectory, fileUtilsInterface); String dataMode = "CAPI"; VtlBindings vtlBindings = new VtlBindings(); boolean withAllReportingData = false; @@ -47,7 +51,7 @@ void buildVtlBindings_success_changingDdi_and_reportingData(boolean withDdi, boo //GIVEN UserInputsFile userInputsFile = new UserInputsFile( inputSamplesDirectory.resolve("inputs_valid.json"), - inputSamplesDirectory); + inputSamplesDirectory, fileUtilsInterface); String dataMode = "CAPI"; VtlBindings vtlBindings = new VtlBindings(); BuildBindingsSequence bbs = new BuildBindingsSequence(withAllReportingData); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileUtilsTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java similarity index 78% rename from kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileUtilsTest.java rename to kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java index dcb6a065..c6e3ad0d 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileUtilsTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java @@ -5,8 +5,8 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.UserInputsFile; import org.junit.jupiter.api.Assertions; +import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; -import org.springframework.util.FileSystemUtils; import java.io.File; import java.io.IOException; @@ -14,29 +14,34 @@ import java.nio.file.Path; import java.nio.file.Paths; import java.time.LocalDateTime; -import java.util.Objects; import static org.junit.Assert.assertThrows; import static org.junit.jupiter.api.Assertions.assertEquals; -class FileUtilsTest { +class FileSystemImplTest { + private static FileUtilsInterface fileUtilsInterface; + + @BeforeAll + static void init(){ + fileUtilsInterface = new FileSystemImpl(); + } @Test void testTransformToOut() { assertEquals(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/out/VQS"), - FileUtils.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"))); + FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"))); } @Test void testTransformToOut2() { Path path = Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/out/VQS"); - assertEquals(path,FileUtils.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"), LocalDateTime.now()).getParent()); + assertEquals(path, FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"), LocalDateTime.now()).getParent()); } @Test void archiveInputFiles_failWhenNull() { - assertThrows(NullPointerException.class, () -> FileUtils.archiveInputFiles(null)); + assertThrows(NullPointerException.class, () -> fileUtilsInterface.archiveInputFiles(null)); } @@ -46,7 +51,7 @@ void archiveInputFiles_ok() throws IOException, KraftwerkException{ //GIVEN String campaignName = "move_files"; Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, campaignName, "execute"); - FileSystemUtils.deleteRecursively(inputDirectory); + org.springframework.util.FileSystemUtils.deleteRecursively(inputDirectory); Files.createDirectories(inputDirectory); Files.copy(Path.of(TestConstants.UNIT_TESTS_DIRECTORY, campaignName,"move_files.json"), Path.of(inputDirectory.toString(),"move_files.json")); @@ -77,11 +82,11 @@ void archiveInputFiles_ok() throws IOException, KraftwerkException{ new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000009.json")).createNewFile(); new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000010.json")).createNewFile(); - UserInputsFile testUserInputsFile = new UserInputsFile(Path.of(inputDirectory.toString(), "move_files.json"),inputDirectory); + UserInputsFile testUserInputsFile = new UserInputsFile(Path.of(inputDirectory.toString(), "move_files.json"),inputDirectory, fileUtilsInterface); //WHEN - FileUtils.archiveInputFiles(testUserInputsFile); + fileUtilsInterface.archiveInputFiles(testUserInputsFile); //THEN Assertions.assertTrue(new File(inputDirectory.toString() + "/Archive/papier").exists()); @@ -90,7 +95,7 @@ void archiveInputFiles_ok() throws IOException, KraftwerkException{ Assertions.assertTrue(new File(inputDirectory.toString() + "/Archive/suivi/reportingdata.xml").exists()); //CLEAN - FileSystemUtils.deleteRecursively(inputDirectory); + org.springframework.util.FileSystemUtils.deleteRecursively(inputDirectory); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java index 189a918c..7cec33fd 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java @@ -24,11 +24,13 @@ class XMLSplitterTest { static final String outDirectory = TestConstants.UNIT_TESTS_DUMP+"/split/"; + static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @BeforeAll static void cleanUpBeforeTests() throws Exception { File file = new File(outDirectory); if (file.exists()) { - List splitFiles = FileUtils.listFiles(outDirectory); + List splitFiles = fileUtilsInterface.listFiles(outDirectory); if (splitFiles != null){ for (String splitFile : splitFiles) { if(!Files.deleteIfExists(Paths.get(outDirectory+splitFile))){ @@ -44,14 +46,14 @@ static void cleanUpBeforeTests() throws Exception { @Test @DisplayName("OutDirectory should contain 3 files") void splitInThreeTest() throws XMLStreamException, IOException { - List splitFiles = FileUtils.listFiles(outDirectory); + List splitFiles = fileUtilsInterface.listFiles(outDirectory); assertEquals(3,splitFiles.size()); } @Test @DisplayName("File split1.xml file should contain 2 survey units") void contains2SuTest() throws XMLStreamException, IOException { - List splitFiles = FileUtils.listFiles(outDirectory); + List splitFiles = fileUtilsInterface.listFiles(outDirectory); int count = 0; XMLInputFactory factory = XMLInputFactory.newInstance(); try { diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java index 806ae6ed..612ff805 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java @@ -15,7 +15,8 @@ import fr.insee.kraftwerk.core.outputs.csv.CsvOutputFiles; import fr.insee.kraftwerk.core.sequence.*; import fr.insee.kraftwerk.core.utils.CsvUtils; -import fr.insee.kraftwerk.core.utils.FileUtils; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import io.cucumber.java.Before; @@ -63,7 +64,8 @@ public class MainDefinitions { @Before public void clean() throws KraftwerkException { - FileUtils.deleteDirectory(outDirectory); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + fileUtilsInterface.deleteDirectory(outDirectory); } @Given("Step 0 : We have some survey in directory {string}") @@ -96,19 +98,19 @@ public void init_VTL_script(String vtlScriptName, String variableToCreate, Strin @When("Step 1 : We initialize the input files") public void initialize_input_files() throws KraftwerkException { System.out.println("InDirectory value : " + inDirectory); - userInputsFile = controlInputSequence.getUserInputs(inDirectory); + userInputsFile = controlInputSequence.getUserInputs(inDirectory, new FileSystemImpl()); vtlBindings = new VtlBindings(); } @When("Step 1 : We initialize with input file {string}") public void initialize_with_specific_input(String inputFileName) throws KraftwerkException { - userInputsFile = new UserInputsFile(inDirectory.resolve(inputFileName), inDirectory); + userInputsFile = new UserInputsFile(inDirectory.resolve(inputFileName), inDirectory, new FileSystemImpl()); vtlBindings = new VtlBindings(); } @When("Step 1 : We initialize metadata model with lunatic specification only") public void initialize_metadata_model_with_lunatic() throws KraftwerkException { - MainProcessing mp = new MainProcessing(inDirectory.toString(), false,false,false, "defaultDirectory", 419430400L); + MainProcessing mp = new MainProcessing(inDirectory.toString(), false,false,false, "defaultDirectory", 419430400L, new FileSystemImpl()); mp.init(); userInputsFile=mp.getUserInputsFile(); metadataModelMap=mp.getMetadataModels(); @@ -116,7 +118,7 @@ public void initialize_metadata_model_with_lunatic() throws KraftwerkException { @When("Step 1 : We initialize metadata model with DDI specification only") public void initialize_metadata_model_with_DDI() throws KraftwerkException { - MainProcessing mp = new MainProcessing(inDirectory.toString(), false,false,true, "defaultDirectory", 419430400L); + MainProcessing mp = new MainProcessing(inDirectory.toString(), false,false,true, "defaultDirectory", 419430400L, new FileSystemImpl()); mp.init(); userInputsFile=mp.getUserInputsFile(); metadataModelMap=mp.getMetadataModels(); @@ -127,7 +129,7 @@ public void launch_main() throws KraftwerkException { // We clean the output and the temp directory deleteDirectory(outDirectory.toFile()); deleteDirectory(tempDirectory.toFile()); - MainProcessing mp = new MainProcessing(inDirectory.toString(), false, "defaultDirectory", 419430400L); + MainProcessing mp = new MainProcessing(inDirectory.toString(), false, "defaultDirectory", 419430400L, new FileSystemImpl()); mp.runMain(); } @@ -136,10 +138,10 @@ public void launch_main_2() throws KraftwerkException, InterruptedException { // We clean the output and the temp directory deleteDirectory(outDirectory.toFile()); deleteDirectory(tempDirectory.toFile()); - MainProcessing mp = new MainProcessing(inDirectory.toString(), false, "defaultDirectory", 419430400L); + MainProcessing mp = new MainProcessing(inDirectory.toString(), false, "defaultDirectory", 419430400L, new FileSystemImpl()); mp.runMain(); await().atMost(2, TimeUnit.SECONDS); - mp = new MainProcessing(inDirectory.toString(), false, "defaultDirectory", 419430400L); + mp = new MainProcessing(inDirectory.toString(), false, "defaultDirectory", 419430400L, new FileSystemImpl()); mp.runMain(); } @@ -149,7 +151,7 @@ public void launch_main_filebyfile() throws KraftwerkException { deleteDirectory(outDirectory.toFile()); deleteDirectory(tempDirectory.toFile()); MainProcessing mp = new MainProcessing(inDirectory.toString(), true, - Paths.get(FUNCTIONAL_TESTS_INPUT_DIRECTORY).resolve(campaignName).toString(), 419430400L); + Paths.get(FUNCTIONAL_TESTS_INPUT_DIRECTORY).resolve(campaignName).toString(), 419430400L, new FileSystemImpl()); mp.runMain(); } @@ -161,14 +163,14 @@ public void unimodal_treatments() throws NullException { boolean withDDI = true; buildBindingsSequence.buildVtlBindings(userInputsFile, dataMode, vtlBindings, metadataModelMap.get(dataMode), withDDI,null); UnimodalSequence unimodal = new UnimodalSequence(); - unimodal.applyUnimodalSequence(userInputsFile, dataMode, vtlBindings, errors, metadataModelMap); + unimodal.applyUnimodalSequence(userInputsFile, dataMode, vtlBindings, errors, metadataModelMap, new FileSystemImpl()); } } @When("Step 3 : We aggregate each unimodal dataset into a multimodal dataset") public void aggregate_datasets() { MultimodalSequence multimodalSequence = new MultimodalSequence(); - multimodalSequence.multimodalProcessing(userInputsFile, vtlBindings, errors, metadataModelMap); + multimodalSequence.multimodalProcessing(userInputsFile, vtlBindings, errors, metadataModelMap, new FileSystemImpl()); } @When("Step 4 : We export the final version") @@ -282,8 +284,8 @@ boolean deleteDirectory(File directoryToBeDeleted) { } private void writeErrorsFile(Path inDirectory,LocalDateTime localDateTime, List errors) { - Path tempOutputPath = FileUtils.transformToOut(inDirectory,localDateTime).resolve(Constants.ERRORS_FILE_NAME); - FileUtils.createDirectoryIfNotExist(tempOutputPath.getParent()); + Path tempOutputPath = FileUtilsInterface.transformToOut(inDirectory,localDateTime).resolve(Constants.ERRORS_FILE_NAME); + FileSystemImpl.createDirectoryIfNotExist(tempOutputPath.getParent()); // Write errors file if (!errors.isEmpty()) { diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java index 90b31d60..5f91aab4 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java @@ -13,6 +13,8 @@ import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.sequence.ControlInputSequence; +import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.FileUtilsInterface; import io.cucumber.java.en.Given; import io.cucumber.java.en.Then; import io.cucumber.java.en.When; @@ -33,13 +35,14 @@ public class ParadataDefinitions { String userInputFileName = Constants.USER_INPUT_FILE; ModeInputs modeInputs; private ControlInputSequence controlInputSequence; + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); @Given("We read data from input named {string}") public void launch_all_steps(String campaignName) throws KraftwerkException { Path campaignDirectory = Paths.get(FUNCTIONAL_TESTS_INPUT_DIRECTORY).resolve(campaignName); controlInputSequence = new ControlInputSequence(campaignDirectory.toString()); - UserInputsFile userInputs = controlInputSequence.getUserInputs(campaignDirectory); + UserInputsFile userInputs = controlInputSequence.getUserInputs(campaignDirectory, fileUtilsInterface); // For now, only one file String modeName = userInputs.getModes().getFirst(); modeInputs = userInputs.getModeInputs(modeName); From 22b5a559953da69d3a607572dcfdbe2d3d8ba952 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Thu, 20 Jun 2024 10:19:55 +0200 Subject: [PATCH 15/46] Add minio implementation + remove Files calls to use interface + moved to package --- .../fr/insee/kraftwerk/api/KraftwerkApi.java | 3 + .../kraftwerk/api/batch/KraftwerkBatch.java | 25 +- .../api/configuration/MinioConfig.java | 15 ++ .../kraftwerk/api/process/MainProcessing.java | 2 +- .../api/process/MainProcessingGenesis.java | 2 +- .../api/services/KraftwerkService.java | 2 +- .../kraftwerk/api/services/MainService.java | 44 ++- .../api/services/SplitterService.java | 2 +- .../api/services/StepByStepService.java | 60 ++++- kraftwerk-core/pom.xml | 7 + .../kraftwerk/core/inputs/UserInputs.java | 2 +- .../kraftwerk/core/inputs/UserInputsFile.java | 2 +- .../core/inputs/UserInputsGenesis.java | 2 +- .../kraftwerk/core/outputs/OutputFiles.java | 2 +- .../BuildBindingsSequenceGenesis.java | 2 +- .../core/sequence/ControlInputSequence.java | 2 +- .../core/sequence/MultimodalSequence.java | 2 +- .../core/sequence/UnimodalSequence.java | 2 +- .../sequence/VtlReaderWriterSequence.java | 2 +- .../core/sequence/WriterSequence.java | 2 +- .../kraftwerk/core/utils/TextFileWriter.java | 2 + .../kraftwerk/core/utils/XMLSplitter.java | 2 + .../utils/{ => files}/FileSystemImpl.java | 16 +- .../utils/{ => files}/FileUtilsInterface.java | 2 +- .../kraftwerk/core/utils/files/MinioImpl.java | 253 ++++++++++++++++++ .../insee/kraftwerk/core/vtl/VtlExecute.java | 2 +- .../src/main/resources/application.properties | 6 +- .../core/inputs/UserInputsFileTest.java | 4 +- .../core/inputs/UserInputsGenesisTest.java | 2 +- .../core/outputs/CsvOutputFilesTest.java | 4 +- .../core/outputs/CsvTableWriterTest.java | 2 +- .../core/outputs/ParquetOutputFilesTest.java | 4 +- .../sequence/BuildBindingsSequenceTest.java | 4 +- .../core/utils/FileSystemImplTest.java | 2 + .../kraftwerk/core/utils/XMLSplitterTest.java | 2 + .../functional_tests/MainDefinitions.java | 4 +- .../functional_tests/ParadataDefinitions.java | 4 +- 37 files changed, 438 insertions(+), 59 deletions(-) create mode 100644 kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java rename kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/{ => files}/FileSystemImpl.java (97%) rename kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/{ => files}/FileUtilsInterface.java (97%) create mode 100644 kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/KraftwerkApi.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/KraftwerkApi.java index d52cce83..7df38182 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/KraftwerkApi.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/KraftwerkApi.java @@ -1,13 +1,16 @@ package fr.insee.kraftwerk.api; +import fr.insee.kraftwerk.api.configuration.MinioConfig; import org.springframework.boot.SpringApplication; import org.springframework.boot.autoconfigure.SpringBootApplication; import org.springframework.boot.builder.SpringApplicationBuilder; import org.springframework.boot.context.properties.ConfigurationPropertiesScan; +import org.springframework.boot.context.properties.EnableConfigurationProperties; import org.springframework.boot.web.servlet.support.SpringBootServletInitializer; @SpringBootApplication @ConfigurationPropertiesScan +@EnableConfigurationProperties(MinioConfig.class) public class KraftwerkApi extends SpringBootServletInitializer { diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index 2b363615..b0864677 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -1,10 +1,12 @@ package fr.insee.kraftwerk.api.batch; import fr.insee.kraftwerk.api.configuration.ConfigProperties; +import fr.insee.kraftwerk.api.configuration.MinioConfig; import fr.insee.kraftwerk.api.process.MainProcessing; import fr.insee.kraftwerk.api.process.MainProcessingGenesis; import fr.insee.kraftwerk.api.services.KraftwerkService; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.MinioImpl; +import io.minio.MinioClient; import lombok.extern.slf4j.Slf4j; import org.springframework.beans.factory.annotation.Autowired; import org.springframework.beans.factory.annotation.Value; @@ -14,12 +16,10 @@ @Component @Slf4j public class KraftwerkBatch implements CommandLineRunner { - @Autowired - public KraftwerkBatch(ConfigProperties configProperties) { - this.configProperties = configProperties; - } ConfigProperties configProperties; + MinioConfig minioConfig; + MinioClient minioClient; @Value("${fr.insee.postcollecte.files}") protected String defaultDirectory; @@ -27,6 +27,15 @@ public KraftwerkBatch(ConfigProperties configProperties) { @Value("${fr.insee.postcollecte.size-limit}") protected long limitSize; + @Autowired + public KraftwerkBatch(ConfigProperties configProperties, MinioConfig minioConfig) { + this.configProperties = configProperties; + this.minioConfig = minioConfig; + if(minioConfig.isEnable()){ + minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); + } + } + @Override public void run(String... args) throws Exception{ //If .jar launched with cli args @@ -55,17 +64,17 @@ public void run(String... args) throws Exception{ //Run kraftwerk if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ - MainProcessingGenesis mainProcessingGenesis = new MainProcessingGenesis(configProperties, new FileSystemImpl()); + MainProcessingGenesis mainProcessingGenesis = new MainProcessingGenesis(configProperties, new MinioImpl(minioClient, minioConfig.getBucketName())); mainProcessingGenesis.runMain(inDirectory); }else{ - MainProcessing mainProcessing = new MainProcessing(inDirectory, fileByFile, withAllReportingData, withDDI, defaultDirectory, limitSize, new FileSystemImpl()); + MainProcessing mainProcessing = new MainProcessing(inDirectory, fileByFile, withAllReportingData, withDDI, defaultDirectory, limitSize, new MinioImpl(minioClient, minioConfig.getBucketName())); mainProcessing.runMain(); } //Archive if(Boolean.TRUE.equals(archiveAtEnd)){ KraftwerkService kraftwerkService = new KraftwerkService(); - kraftwerkService.archive(inDirectory, new FileSystemImpl()); + kraftwerkService.archive(inDirectory, new MinioImpl(minioClient, minioConfig.getBucketName())); } System.exit(0); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java new file mode 100644 index 00000000..1bd8e6b2 --- /dev/null +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java @@ -0,0 +1,15 @@ +package fr.insee.kraftwerk.api.configuration; + +import lombok.Getter; +import org.springframework.boot.context.properties.ConfigurationProperties; + +@ConfigurationProperties(prefix = "fr.insee.postcollecte.minio") +@Getter +public class MinioConfig { + private String endpoint; + private String accessKey; + private String secretKey; + private boolean enable; + + private String bucketName; +} diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java index 133abdf4..407a504a 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java @@ -7,7 +7,7 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.MetadataUtils; import fr.insee.kraftwerk.core.sequence.*; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.utils.log.KraftwerkExecutionLog; import fr.insee.kraftwerk.core.vtl.VtlBindings; diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java index a15c0702..dc86bbde 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java @@ -15,7 +15,7 @@ import fr.insee.kraftwerk.core.sequence.MultimodalSequence; import fr.insee.kraftwerk.core.sequence.UnimodalSequence; import fr.insee.kraftwerk.core.sequence.WriterSequence; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.Getter; diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java index ec7126b0..1b05c0c6 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.sequence.ControlInputSequence; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import io.swagger.v3.oas.annotations.responses.ApiResponse; import io.swagger.v3.oas.annotations.responses.ApiResponses; import jakarta.annotation.PostConstruct; diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java index c8670742..e8a1ddf1 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java @@ -2,12 +2,15 @@ import fr.insee.kraftwerk.api.configuration.ConfigProperties; +import fr.insee.kraftwerk.api.configuration.MinioConfig; import fr.insee.kraftwerk.api.process.MainProcessing; import fr.insee.kraftwerk.api.process.MainProcessingGenesis; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.sequence.ControlInputSequenceGenesis; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.MinioImpl; +import io.minio.MinioClient; import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.Parameter; import io.swagger.v3.oas.annotations.tags.Tag; @@ -27,10 +30,16 @@ public class MainService extends KraftwerkService { ConfigProperties configProperties; + MinioConfig minioConfig; + MinioClient minioClient; @Autowired - public MainService(ConfigProperties configProperties) { + public MainService(ConfigProperties configProperties, MinioConfig minioConfig) { this.configProperties = configProperties; + this.minioConfig = minioConfig; + if(minioConfig.isEnable()){ + minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); + } } @PutMapping(value = "/main") @@ -42,7 +51,12 @@ public ResponseEntity mainService( ) { boolean fileByFile = false; boolean withDDI = true; - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { @@ -66,7 +80,12 @@ public ResponseEntity mainFileByFile( boolean fileByFile = true; boolean withAllReportingData = false; boolean withDDI = true; - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { @@ -89,7 +108,12 @@ public ResponseEntity mainLunaticOnly( boolean withDDI = false; boolean fileByFile = false; boolean withAllReportingData = false; - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { @@ -107,7 +131,13 @@ public ResponseEntity mainLunaticOnly( @Operation(operationId = "mainGenesis", summary = "${summary.mainGenesis}", description = "${description.mainGenesis}") public ResponseEntity mainGenesis( @Parameter(description = "${param.idCampaign}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String idCampaign) { - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } + MainProcessingGenesis mpGenesis = new MainProcessingGenesis(configProperties, fileUtilsInterface); try { diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java index ea4ff382..7a0c93f0 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java @@ -14,7 +14,7 @@ @Tag(name = "${tag.splitter}") @Log4j2 public class SplitterService extends KraftwerkService{ - +//TODO add MinIO support @Operation(summary = "Split a XML file into smaller ones") @PutMapping(path = "/split/lunatic-xml") public ResponseEntity saveResponsesFromXmlFile(@RequestParam("inputFolder") String inputFolder, diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java index c3591a93..511d896f 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java @@ -1,5 +1,6 @@ package fr.insee.kraftwerk.api.services; +import fr.insee.kraftwerk.api.configuration.MinioConfig; import fr.insee.kraftwerk.api.process.MainProcessing; import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.dataprocessing.StepEnum; @@ -9,13 +10,16 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.MetadataUtils; import fr.insee.kraftwerk.core.sequence.*; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.MinioImpl; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; +import io.minio.MinioClient; import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.Parameter; import io.swagger.v3.oas.annotations.tags.Tag; +import org.springframework.beans.factory.annotation.Autowired; import org.springframework.http.ResponseEntity; import org.springframework.web.bind.annotation.*; @@ -31,6 +35,16 @@ @RestController @Tag(name = "${tag.stepbystep}") public class StepByStepService extends KraftwerkService { + MinioConfig minioConfig; + MinioClient minioClient; + + @Autowired + public StepByStepService(MinioConfig minioConfig) { + this.minioConfig = minioConfig; + if(minioConfig.isEnable()){ + minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); + } + } @PutMapping(value = "/buildVtlBindings") @Operation(operationId = "buildVtlBindings", summary = "${summary.buildVtlBindings}", description = "${description.buildVtlBindings}") @@ -41,7 +55,12 @@ public ResponseEntity buildVtlBindings( //Read data files boolean fileByFile = false; boolean withDDI = true; - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { @@ -80,7 +99,12 @@ public ResponseEntity buildVtlBindingsByDataMode( //Read data files boolean fileByFile = false; boolean withDDI = true; - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } MainProcessing mp = new MainProcessing(inDirectoryParam, fileByFile,withAllReportingData,withDDI, defaultDirectory, limitSize, fileUtilsInterface); try { @@ -112,7 +136,12 @@ public ResponseEntity unimodalProcessing( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam, @Parameter(description = "${param.dataMode}", required = true) @RequestParam String dataMode ) { - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } //Read data in JSON file Path inDirectory; @@ -155,7 +184,12 @@ public ResponseEntity unimodalProcessing( public ResponseEntity multimodalProcessing( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam ) { - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } //Read data in JSON file Path inDirectory; @@ -203,7 +237,12 @@ public ResponseEntity multimodalProcessing( public ResponseEntity writeOutputFiles( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam ) throws KraftwerkException { - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } Path inDirectory; try { @@ -242,7 +281,12 @@ public ResponseEntity writeOutputFiles( @Operation(operationId = "archive", summary = "${summary.archive}", description = "${description.archive}") public ResponseEntity archiveService( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam) { - FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); //TODO Minio if kube + FileUtilsInterface fileUtilsInterface; + if(Boolean.TRUE.equals(minioConfig.isEnable())){ + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } return archive(inDirectoryParam, fileUtilsInterface); } diff --git a/kraftwerk-core/pom.xml b/kraftwerk-core/pom.xml index 009e2705..db8575a0 100644 --- a/kraftwerk-core/pom.xml +++ b/kraftwerk-core/pom.xml @@ -225,6 +225,13 @@ commons-compress 1.26.2 + + + + io.minio + minio + 8.5.10 + \ No newline at end of file diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java index 99fde59a..fc9c297d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputs.java @@ -1,6 +1,6 @@ package fr.insee.kraftwerk.core.inputs; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.Getter; import lombok.Setter; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java index 9a280407..d941c332 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.exceptions.MissingMandatoryFieldException; import fr.insee.kraftwerk.core.exceptions.UnknownDataFormatException; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.JsonFileReader; import lombok.Getter; import lombok.Setter; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java index 81048103..99a5869b 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java @@ -6,7 +6,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.exceptions.MissingMandatoryFieldException; import fr.insee.kraftwerk.core.exceptions.UnknownDataFormatException; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.JsonFileReader; import lombok.extern.log4j.Log4j2; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java index a5f52b31..08aec114 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.metadata.MetadataModel; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.Getter; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java index e39b0354..53674eb3 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java @@ -15,7 +15,7 @@ import fr.insee.kraftwerk.core.rawdata.GroupInstance; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java index d83af81e..6e941eea 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java @@ -7,7 +7,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.UserInputsFile; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; @Log4j2 diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java index 4bca68c9..f37f8bb0 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/MultimodalSequence.java @@ -12,7 +12,7 @@ import fr.insee.kraftwerk.core.dataprocessing.ReconciliationProcessing; import fr.insee.kraftwerk.core.inputs.UserInputs; import fr.insee.kraftwerk.core.metadata.MetadataModel; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.NoArgsConstructor; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java index 0dbc6f98..2d4d44f7 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java @@ -6,7 +6,7 @@ import fr.insee.kraftwerk.core.inputs.ModeInputs; import fr.insee.kraftwerk.core.inputs.UserInputs; import fr.insee.kraftwerk.core.metadata.*; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.NoArgsConstructor; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java index 9263217c..93363d78 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/VtlReaderWriterSequence.java @@ -4,7 +4,7 @@ import java.nio.file.Path; import fr.insee.kraftwerk.core.dataprocessing.StepEnum; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java index f73a4290..6ddc9a6f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java @@ -7,7 +7,7 @@ import fr.insee.kraftwerk.core.outputs.OutputFiles; import fr.insee.kraftwerk.core.outputs.csv.CsvOutputFiles; import fr.insee.kraftwerk.core.outputs.parquet.ParquetOutputFiles; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.log.KraftwerkExecutionLog; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.NoArgsConstructor; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java index 5fbfa75c..9f0f2f78 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java @@ -8,6 +8,8 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.Constants; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.log.KraftwerkExecutionLog; import lombok.extern.log4j.Log4j2; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java index e5f4ff56..0ecb43db 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java @@ -1,5 +1,7 @@ package fr.insee.kraftwerk.core.utils; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; + import javax.xml.stream.*; import javax.xml.stream.events.EndDocument; import javax.xml.stream.events.StartDocument; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java similarity index 97% rename from kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileSystemImpl.java rename to kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 49d9e416..aec7d64d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -1,9 +1,10 @@ -package fr.insee.kraftwerk.core.utils; +package fr.insee.kraftwerk.core.utils.files; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.ModeInputs; import fr.insee.kraftwerk.core.inputs.UserInputs; import fr.insee.kraftwerk.core.inputs.UserInputsFile; +import fr.insee.kraftwerk.core.utils.DateUtils; import lombok.NoArgsConstructor; import lombok.extern.log4j.Log4j2; @@ -31,8 +32,8 @@ public class FileSystemImpl implements FileUtilsInterface{ /** * Move the input file to another directory to archive it */ + @Override public void renameInputFile(Path inDirectory) { - File file = inDirectory.resolve("kraftwerk.json").toFile(); String fileWithTime = "kraftwerk-" + DateUtils.getCurrentTimeStamp() + ".json"; File file2 = inDirectory.resolve(fileWithTime).toFile(); @@ -50,6 +51,7 @@ public void renameInputFile(Path inDirectory) { } } + @Override public void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException { // Path inputFolder = userInputsFile.getInputDirectory(); @@ -160,8 +162,8 @@ private String getRoot(Path path, String campaignName) { } return result.toString(); } - - + + @Override public void deleteDirectory(Path directoryPath) throws KraftwerkException { try { org.springframework.util.FileSystemUtils.deleteRecursively(directoryPath); @@ -175,13 +177,15 @@ public void deleteDirectory(Path directoryPath) throws KraftwerkException { * @param dir * @return */ + @Override public List listFiles(String dir) { return Stream.of(new File(dir).listFiles()) .filter(file -> !file.isDirectory()) .map(File::getName) .toList(); } - + + @Override public Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset) { createDirectoryIfNotExist(FileUtilsInterface.transformToTemp(userInputs.getInputDirectory())); return FileUtilsInterface.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); @@ -196,6 +200,7 @@ public static void createDirectoryIfNotExist(Path path) { } } + @Override public Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { Path inputPath = inputDirectory.resolve(userField); @@ -208,6 +213,7 @@ public Path convertToPath(String userField, Path inputDirectory) throws Kraftwer } } + @Override public URL convertToUrl(String userField, Path inputDirectory) { if (userField == null) { log.debug("null value out of method that reads DDI field (should not happen)."); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java similarity index 97% rename from kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtilsInterface.java rename to kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index 2b221d53..f9bcbb1b 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -1,4 +1,4 @@ -package fr.insee.kraftwerk.core.utils; +package fr.insee.kraftwerk.core.utils.files; import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java new file mode 100644 index 00000000..cfdc90aa --- /dev/null +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -0,0 +1,253 @@ +package fr.insee.kraftwerk.core.utils.files; + +import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.inputs.ModeInputs; +import fr.insee.kraftwerk.core.inputs.UserInputs; +import fr.insee.kraftwerk.core.inputs.UserInputsFile; +import fr.insee.kraftwerk.core.utils.DateUtils; +import io.minio.CopyObjectArgs; +import io.minio.CopySource; +import io.minio.GetObjectArgs; +import io.minio.ListObjectsArgs; +import io.minio.MinioClient; +import io.minio.PutObjectArgs; +import io.minio.RemoveObjectArgs; +import io.minio.Result; +import io.minio.StatObjectArgs; +import io.minio.errors.ErrorResponseException; +import io.minio.messages.Item; +import lombok.AllArgsConstructor; +import lombok.extern.slf4j.Slf4j; + +import java.io.File; +import java.io.InputStream; +import java.net.MalformedURLException; +import java.net.URI; +import java.net.URISyntaxException; +import java.net.URL; +import java.nio.file.Path; +import java.util.ArrayList; +import java.util.Arrays; +import java.util.List; +import java.util.regex.Pattern; + +@Slf4j +@AllArgsConstructor +public class MinioImpl implements FileUtilsInterface { + + private static final String ARCHIVE = "Archive"; + + MinioClient minioClient; + String bucketName; + + + @Override + public void renameInputFile(Path inDirectory) { + String file1MinioPathString = inDirectory.resolve("/kraftwerk.json").toString(); + String fileWithTime = "kraftwerk-" + DateUtils.getCurrentTimeStamp() + ".json"; + String file2MinioPathString = inDirectory.resolve(fileWithTime).toString(); + if (isObjectExist(file2MinioPathString)) { + log.warn(String.format("Trying to rename '%s' to '%s', but second file already exists.", Path.of(file1MinioPathString).getFileName(), Path.of(file2MinioPathString).getFileName())); + log.warn("Timestamped input file will be over-written."); + deleteFile(file2MinioPathString); + } + moveFile(file1MinioPathString, file2MinioPathString); + } + + @Override + public void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException { + // + Path inputFolder = userInputsFile.getInputDirectory(); + String[] directories = inputFolder.toString().split(Pattern.quote(File.separator)); + String campaignName = directories[directories.length - 1]; + + // + for (String mode : userInputsFile.getModes()) { + ModeInputs modeInputs = userInputsFile.getModeInputs(mode); + archiveData(inputFolder, campaignName, modeInputs); + archiveParadata(inputFolder, campaignName, modeInputs); + archiveReportingData(inputFolder, campaignName, modeInputs); + } + } + + private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) { + Path dataPath = modeInputs.getDataFile(); + Path newDataPath = inputFolder.resolve(ARCHIVE).resolve(getRoot(dataPath, campaignName)); + + if (!isDirectory(dataPath.toString())) { + moveFile(dataPath.toString(), newDataPath.toString()); + } else { + moveDirectory(dataPath.toString(), newDataPath.toString()); + } + } + + /** + * If paradata, we move the paradata folder + */ + private void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs){ + if (modeInputs.getParadataFolder() != null) { + moveDirectory(modeInputs.getParadataFolder().toString(), inputFolder.resolve(ARCHIVE) + .resolve(getRoot(modeInputs.getParadataFolder(), campaignName)).toString()); + } + } + + /** + * If reporting data, we move reporting data files + */ + private void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs){ + if (modeInputs.getReportingDataFile() != null) { + moveDirectory(modeInputs.getReportingDataFile().toString(), inputFolder.resolve(ARCHIVE) + .resolve(getRoot(modeInputs.getReportingDataFile(), campaignName)).toString()); + } + } + + private String getRoot(Path path, String campaignName) { + String[] directories = path.toString().split(Pattern.quote(File.separator)); + int campaignIndex = Arrays.asList(directories).indexOf(campaignName); + String[] newDirectories = Arrays.copyOfRange(directories, campaignIndex + 1, directories.length); + StringBuilder result = new StringBuilder(); + String sep = ""; + for (String directory : newDirectories) { + result.append(sep).append(directory); + sep = File.separator; + } + return result.toString(); + } + + @Override + public void deleteDirectory(Path directoryPath) throws KraftwerkException { + try { + for (String filePath : listFiles(directoryPath.toString())) { + deleteFile(filePath); + } + } catch (Exception e) { + log.error(e.toString()); + } + } + + @Override + public List listFiles(String dir) { + try { + ArrayList filePaths = new ArrayList<>(); + Iterable> results = minioClient.listObjects( + ListObjectsArgs.builder().bucket(bucketName).prefix(dir).recursive(true).build()); + + for (Result result : results) { + filePaths.add(result.get().objectName()); + } + return filePaths; + } catch (Exception e) { + log.error(e.toString()); + return null; + } + } + + @Override + public Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset) { + return FileUtilsInterface.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); + } + + @Override + public Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { + if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { + return inputDirectory.resolve(userField); + } else { + return null; + } + } + + @Override + public URL convertToUrl(String userField, Path inputDirectory) { + if (userField == null) { + log.debug("null value out of method that reads DDI field (should not happen)."); + return null; + } + try { + if (userField.startsWith("http")) { + return new URI(userField).toURL(); + } + return inputDirectory.resolve(userField).toFile().toURI().toURL(); + } catch (MalformedURLException | URISyntaxException e) { + log.error("Unable to convert URL from user input: " + userField); + return null; + } + } + + //Utilities + + private InputStream readFile(String minioPath) { + try { + return minioClient.getObject(GetObjectArgs.builder().bucket(bucketName).object(minioPath).build()); + } catch (Exception e) { + log.error(e.toString()); + return null; + } + } + + private void writeFile(String minioPath, InputStream inputStream, int fileSize) { + try { + minioClient.putObject(PutObjectArgs.builder().bucket(bucketName).stream(inputStream, fileSize, -1).object(minioPath).build()); + } catch (Exception e) { + log.error(e.toString()); + } + } + + private void copyFile(String srcMinioPath, String dstMinioPath) { + try { + CopySource copySource = CopySource.builder().bucket(bucketName).object(srcMinioPath).build(); + minioClient.copyObject(CopyObjectArgs.builder().bucket(bucketName).object(dstMinioPath).source(copySource).build()); + } catch (Exception e) { + log.error(e.toString()); + } + } + + private void moveFile(String srcMinioPath, String dstMinioPath) { + try { + copyFile(srcMinioPath, dstMinioPath); + deleteFile(srcMinioPath); + } catch (Exception e) { + log.error(e.toString()); + } + } + + private void moveDirectory(String srcMinioPath, String dstMinioPath) { + try { + for (String filePath : listFiles(srcMinioPath)) { + moveFile(filePath, dstMinioPath + "/" + extractFileName(filePath)); + } + } catch (Exception e) { + log.error(e.toString()); + } + } + + private String extractFileName(String filePath) { + if (filePath == null || filePath.isEmpty()) { + return ""; + } + return Path.of(filePath).getFileName().toString(); + } + + private void deleteFile(String minioPath) { + try { + minioClient.removeObject(RemoveObjectArgs.builder().bucket(bucketName).object(minioPath).build()); + } catch (Exception e) { + log.error(e.toString()); + } + } + + private boolean isObjectExist(String objectPath) { + try { + minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(objectPath).build()); + return true; + } catch (ErrorResponseException e) { + return false; + } catch (Exception e) { + log.error(e.toString()); + return false; + } + } + + private boolean isDirectory(String path){ + return path.endsWith("/") || path.endsWith("\\"); + } +} diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java index 64fa9ae0..965757ea 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java @@ -5,7 +5,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.TextFileWriter; import fr.insee.vtl.jackson.TrevasModule; import fr.insee.vtl.model.Dataset; diff --git a/kraftwerk-core/src/main/resources/application.properties b/kraftwerk-core/src/main/resources/application.properties index f9107f66..e4cbcfe2 100644 --- a/kraftwerk-core/src/main/resources/application.properties +++ b/kraftwerk-core/src/main/resources/application.properties @@ -1,4 +1,8 @@ # LOGS logging.level.root= INFO logging.level.fr.insee.kraftwerk=INFO -simpleLogger.defaultLogLevel=INFO \ No newline at end of file +simpleLogger.defaultLogLevel=INFO + +# S3 +# Disabled by default +fr.insee.postcollecte.minio.enable = false \ No newline at end of file diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java index 7e94738e..1d4e4811 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java @@ -10,8 +10,8 @@ import java.nio.file.Path; import java.util.Set; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import fr.insee.kraftwerk.core.TestConstants; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java index 2673c45e..85b575d6 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesisTest.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.data.model.Mode; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.parsers.DataFormat; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import org.junit.jupiter.api.Test; import java.io.IOException; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java index c5b8c606..931fb474 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java @@ -10,8 +10,8 @@ import java.util.List; import java.util.Set; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.MethodOrderer.OrderAnnotation; import org.junit.jupiter.api.Order; import org.junit.jupiter.api.Test; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java index de40c28b..61aa8bff 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvTableWriterTest.java @@ -9,7 +9,7 @@ import fr.insee.kraftwerk.core.metadata.VariableType; import fr.insee.kraftwerk.core.outputs.csv.CsvTableWriter; import fr.insee.kraftwerk.core.utils.CsvUtils; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; import fr.insee.vtl.model.InMemoryDataset; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java index e807a8c7..a3fac601 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java @@ -8,8 +8,8 @@ import fr.insee.kraftwerk.core.metadata.Variable; import fr.insee.kraftwerk.core.metadata.VariableType; import fr.insee.kraftwerk.core.outputs.parquet.ParquetOutputFiles; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java index cb1d3999..79f36de8 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java @@ -7,8 +7,8 @@ import fr.insee.kraftwerk.core.metadata.UcqVariable; import fr.insee.kraftwerk.core.metadata.Variable; import fr.insee.kraftwerk.core.metadata.VariableType; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import org.junit.jupiter.api.Test; import org.junit.jupiter.params.ParameterizedTest; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java index c6e3ad0d..baee18ad 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java @@ -4,6 +4,8 @@ import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.UserInputsFile; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java index 7cec33fd..ea3835a6 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java @@ -1,6 +1,8 @@ package fr.insee.kraftwerk.core.utils; import fr.insee.kraftwerk.core.TestConstants; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.DisplayName; import org.junit.jupiter.api.Test; diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java index 612ff805..f2dcb25a 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java @@ -15,8 +15,8 @@ import fr.insee.kraftwerk.core.outputs.csv.CsvOutputFiles; import fr.insee.kraftwerk.core.sequence.*; import fr.insee.kraftwerk.core.utils.CsvUtils; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import io.cucumber.java.Before; diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java index 5f91aab4..eacedeee 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java @@ -13,8 +13,8 @@ import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.sequence.ControlInputSequence; -import fr.insee.kraftwerk.core.utils.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import io.cucumber.java.en.Given; import io.cucumber.java.en.Then; import io.cucumber.java.en.When; From a7534c0b2d9c9d7d098740e15ac4bf12e23ea041 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 21 Jun 2024 09:13:42 +0200 Subject: [PATCH 16/46] Added TODOS to remove Files methods to use interface instead --- .../kraftwerk/api/process/MainProcessing.java | 27 +++++++--------- .../extradata/paradata/ParadataParser.java | 2 +- .../core/inputs/UserInputsGenesis.java | 1 + .../kraftwerk/core/metadata/DDIReader.java | 1 + .../core/outputs/parquet/LocalOutputFile.java | 1 + .../kraftwerk/core/parsers/DataParser.java | 1 + .../core/sequence/ControlInputSequence.java | 3 +- .../sequence/ControlInputSequenceGenesis.java | 1 + .../core/sequence/WriterSequence.java | 2 +- .../core/utils/files/FileSystemImpl.java | 29 +++++++++++++++++ .../core/utils/files/FileUtilsInterface.java | 18 +++++++++++ .../kraftwerk/core/utils/files/MinioImpl.java | 31 ++++++++++++++++--- .../insee/kraftwerk/core/vtl/VtlExecute.java | 2 +- 13 files changed, 94 insertions(+), 25 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java index 407a504a..22ca7a48 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java @@ -13,16 +13,12 @@ import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.Getter; import lombok.extern.log4j.Log4j2; -import org.apache.commons.io.FileUtils; -import java.io.IOException; -import java.nio.file.Files; import java.nio.file.Path; import java.time.LocalDateTime; import java.util.ArrayList; import java.util.List; import java.util.Map; -import java.util.stream.Stream; @Log4j2 public class MainProcessing { @@ -195,26 +191,25 @@ private static List getFilesToProcess(UserInputsFile userInputsFile, Strin log.error("Datapath is null"); return files; } - if (Files.isRegularFile(dataPath)) { - files.add(dataPath); - } else if (Files.isDirectory(dataPath)) { - try (Stream stream = Files.list(dataPath)) { - stream.forEach(files::add); - } catch (IOException e) { - log.error(String.format("IOException occurred when trying to list data files of folder: %s", - dataPath)); - } - } else { + if(userInputsFile.getFileUtilsInterface().isDirectory(dataPath.toString()) == null){ log.warn(String.format("Data path given could not be identified as a file or folder: %s", dataPath)); + return files; + } + if(userInputsFile.getFileUtilsInterface().isDirectory(dataPath.toString())){ + for(String path : userInputsFile.getFileUtilsInterface().listFiles(dataPath.toString())){ + files.add(Path.of(path)); + } + }else{ + files.add(dataPath); } return files; } private void isDataTooBig(UserInputsFile userInputsFile, String errorMessage, long limitSize) throws KraftwerkException { for (String dataMode : userInputsFile.getModeInputsMap().keySet()){ - long dataSize = FileUtils.sizeOf(userInputsFile.getModeInputs(dataMode).getDataFile().toFile()); + long dataSize = userInputsFile.getFileUtilsInterface().getSizeOf(userInputsFile.getModeInputs(dataMode).getDataFile().toString()); if (dataSize > limitSize) { - log.error("Size of data folder/file {} : {}",userInputsFile.getModeInputs(dataMode).getDataFile(), FileUtils.byteCountToDisplaySize(dataSize)); + log.error("Size of data folder/file {} : {}",userInputsFile.getModeInputs(dataMode).getDataFile(), dataSize); throw new KraftwerkException(413,errorMessage); } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java index 18c1331e..4238ebb9 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java @@ -35,7 +35,7 @@ public void parseParadata(Paradata paradata, SurveyRawData surveyRawData) throws throw new NullException("JSONFile not defined"); if (!filePath.toString().contentEquals("")) { - +//TODO Change to interface // Get all filepaths for each ParadataUE try (Stream walk = Files.walk(filePath)) { List listFilePaths = walk.filter(Files::isRegularFile) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java index 99a5869b..6dace939 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java @@ -107,6 +107,7 @@ private String readField(JsonNode node, String field) throws MissingMandatoryFie * @throws IOException – if an I/O error is thrown when accessing the starting file */ public Path findDDIFile(Path specDirectory) throws KraftwerkException, IOException { + //TODO Change to interface try (Stream files = Files.find(specDirectory, 1, (path, basicFileAttributes) -> path.toFile().getName().toLowerCase().matches("ddi[\\w,\\s-]+\\.xml"))) { return files.findFirst() .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + specDirectory.toString())); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java index 83c84fdb..9600f71c 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java @@ -54,6 +54,7 @@ public static MetadataModel getMetadataFromDDI(URL ddiUrl) throws KraftwerkExcep transformDDI(ddiUrl, variablesTempFilePath); MetadataModel metadataModel = readVariables(variablesTempFilePath); + //TODO change to use interface Files.delete(variablesFile.toPath()); return metadataModel; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/LocalOutputFile.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/LocalOutputFile.java index 813a7d42..64a18f13 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/LocalOutputFile.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/LocalOutputFile.java @@ -41,6 +41,7 @@ private class LocalPositionOutputStream extends PositionOutputStream { public LocalPositionOutputStream(int buffer, StandardOpenOption... openOption) throws IOException { stream = new BufferedOutputStream(Files.newOutputStream(path, openOption), buffer); + //TODO Change to interface } @Override diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java index 6f7666fa..e0f8b04d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java @@ -42,6 +42,7 @@ public final void parseSurveyData(Path dataPath, KraftwerkExecutionLog kraftwerk log.error(DATAPATH_IS_NULL); throw new NullException(DATAPATH_IS_NULL); } + //TODO change to use interface if (Files.isRegularFile(dataPath)) { parseDataFile(dataPath); if(kraftwerkExecutionLog != null) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java index 6e941eea..05ea2e8b 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java @@ -30,7 +30,8 @@ public Path getInDirectory(String inDirectoryParam) throws KraftwerkException { if (!verifyInDirectory(inDirectory)) throw new KraftwerkException(400, "Configuration file not found"); return inDirectory; } - + + //TODO Change to interface private boolean verifyInDirectory(Path inDirectory) { Path userInputFile = inDirectory.resolve(Constants.USER_INPUT_FILE); if (Files.exists(userInputFile)) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java index 988feed7..d3517ab1 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java @@ -30,6 +30,7 @@ public Path getInDirectory(String inDirectoryParam) { private boolean verifyInDirectory(Path inDirectory) { Path userInputFile = inDirectory.resolve(Constants.USER_INPUT_FILE); + //TODO change to use interface if (Files.exists(userInputFile)) { log.info(String.format("Found configuration file in campaign folder: %s", userInputFile)); } else { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java index 6ddc9a6f..4bb10630 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java @@ -30,7 +30,7 @@ public void writeOutputFiles(Path inDirectory, LocalDateTime localDateTime, VtlB /* Step 4.1 : write csv output tables */ OutputFiles csvOutputFiles = new CsvOutputFiles(outDirectory, vtlBindings, new ArrayList<>(modeInputsMap.keySet()),kraftwerkExecutionLog); csvOutputFiles.writeOutputTables(metadataModels); - +//TODO change to use interface /* Step 4.2 : write scripts to import csv tables in several languages */ csvOutputFiles.writeImportScripts(metadataModels, errors); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index aec7d64d..46d2cd48 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -7,7 +7,9 @@ import fr.insee.kraftwerk.core.utils.DateUtils; import lombok.NoArgsConstructor; import lombok.extern.log4j.Log4j2; +import org.apache.commons.io.FileUtils; +import javax.annotation.Nullable; import java.io.File; import java.io.IOException; import java.net.MalformedURLException; @@ -16,6 +18,7 @@ import java.net.URL; import java.nio.file.Files; import java.nio.file.Path; +import java.nio.file.StandardOpenOption; import java.util.Arrays; import java.util.List; import java.util.regex.Pattern; @@ -229,4 +232,30 @@ public URL convertToUrl(String userField, Path inputDirectory) { return null; } } + + @Override + @Nullable + public Boolean isDirectory(String path) { + if(!Files.isRegularFile(Path.of(path))){ + return null; + } + File file = new File(path); + return file.isDirectory(); + } + + @Override + public long getSizeOf(String path) { + File file = new File(path); + return FileUtils.sizeOf(file); + } + + @Override + public void writeFile(String path, String toWrite, boolean replace) { + StandardOpenOption standardOpenOption = replace ? StandardOpenOption.TRUNCATE_EXISTING : StandardOpenOption.APPEND; + try { + Files.write(Path.of(path), toWrite.getBytes(), standardOpenOption); + }catch (IOException e){ + log.error(e.toString()); + } + } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index f9bcbb1b..d22ff658 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -5,6 +5,7 @@ import fr.insee.kraftwerk.core.inputs.UserInputs; import fr.insee.kraftwerk.core.inputs.UserInputsFile; +import javax.annotation.Nullable; import java.net.URL; import java.nio.file.Path; import java.time.LocalDateTime; @@ -48,4 +49,21 @@ private static Path transformToOther(Path inDirectory, String other) { Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; URL convertToUrl(String userField, Path inputDirectory); + + /** + * + * @param path path of file + * @return true if directory, false if file, null if neither + */ + @Nullable + Boolean isDirectory(String path); + + /** + * + * @param path path of file + * @return size of file + */ + long getSizeOf(String path); + + void writeFile(String path, String toWrite, boolean replace); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index cfdc90aa..6796eed8 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -14,11 +14,13 @@ import io.minio.RemoveObjectArgs; import io.minio.Result; import io.minio.StatObjectArgs; +import io.minio.StatObjectResponse; import io.minio.errors.ErrorResponseException; import io.minio.messages.Item; import lombok.AllArgsConstructor; import lombok.extern.slf4j.Slf4j; +import java.io.ByteArrayInputStream; import java.io.File; import java.io.InputStream; import java.net.MalformedURLException; @@ -173,6 +175,29 @@ public URL convertToUrl(String userField, Path inputDirectory) { } } + @Override + public Boolean isDirectory(String path){ + return path.endsWith("/") || path.endsWith("\\"); + } + + @Override + public long getSizeOf(String path) { + try { + StatObjectResponse objectStat = minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(path).build()); + return objectStat.size(); + }catch (Exception e){ + log.error(e.toString()); + return 0; + } + } + + @Override + public void writeFile(String path, String toWrite, boolean replace) { + InputStream inputStream = new ByteArrayInputStream(toWrite.getBytes()); + writeFileOnMinio(path, inputStream, toWrite.length()); + } + + //Utilities private InputStream readFile(String minioPath) { @@ -184,7 +209,7 @@ private InputStream readFile(String minioPath) { } } - private void writeFile(String minioPath, InputStream inputStream, int fileSize) { + private void writeFileOnMinio(String minioPath, InputStream inputStream, int fileSize) { try { minioClient.putObject(PutObjectArgs.builder().bucket(bucketName).stream(inputStream, fileSize, -1).object(minioPath).build()); } catch (Exception e) { @@ -246,8 +271,4 @@ private boolean isObjectExist(String objectPath) { return false; } } - - private boolean isDirectory(String path){ - return path.endsWith("/") || path.endsWith("\\"); - } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java index 965757ea..e24b8999 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java @@ -67,7 +67,7 @@ public void convertToVtlDataset(SurveyRawData surveyRawData, String bindingName, Path tempDataset = Paths.get(tempDatasetPath); try { - Files.delete(tempDataset); + Files.delete(tempDataset); //TODO Change to use interface log.debug("File {} deleted",tempDatasetPath); } catch (IOException e) { log.debug("Impossible to delete file {}",tempDatasetPath); From 027abcb136416e19bf15b951b55138d860ccc8f5 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 21 Jun 2024 10:39:48 +0200 Subject: [PATCH 17/46] Fixes after merge --- .../kraftwerk/api/process/MainProcessing.java | 5 +++-- kraftwerk-core/pom.xml | 2 +- .../core/sequence/WriterSequence.java | 4 ++-- .../core/utils/files/FileSystemImpl.java | 17 +++++++++++--- .../core/utils/files/FileUtilsInterface.java | 2 ++ .../kraftwerk/core/utils/files/MinioImpl.java | 22 ++++++++++++++++++- .../core/outputs/CsvOutputFilesTest.java | 7 +++--- .../core/outputs/ParquetOutputFilesTest.java | 1 - .../kraftwerk/core/utils/SqlUtilsTest.java | 4 +++- .../functional_tests/MainDefinitions.java | 7 +++--- 10 files changed, 53 insertions(+), 18 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java index 490f50f4..b3768ccb 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java @@ -199,6 +199,7 @@ private static List getUserInputsFile(UserInputsFile source, boo return userInputsFileList; } + //TODO FIX HERE private static List getFilesToProcess(UserInputsFile userInputsFile, String dataMode) { List files = new ArrayList<>(); ModeInputs modeInputs = userInputsFile.getModeInputs(dataMode); @@ -211,8 +212,8 @@ private static List getFilesToProcess(UserInputsFile userInputsFile, Strin log.warn(String.format("Data path given could not be identified as a file or folder: %s", dataPath)); return files; } - if(userInputsFile.getFileUtilsInterface().isDirectory(dataPath.toString())){ - for(String path : userInputsFile.getFileUtilsInterface().listFiles(dataPath.toString())){ + if(Boolean.TRUE.equals(userInputsFile.getFileUtilsInterface().isDirectory(dataPath.toString()))){ + for(String path : userInputsFile.getFileUtilsInterface().listFilePaths(dataPath.toString())){ files.add(Path.of(path)); } }else{ diff --git a/kraftwerk-core/pom.xml b/kraftwerk-core/pom.xml index 14ecf692..bc2f9842 100644 --- a/kraftwerk-core/pom.xml +++ b/kraftwerk-core/pom.xml @@ -102,6 +102,7 @@ io.minio minio 8.5.10 + @@ -111,5 +112,4 @@ 0.10.3 - \ No newline at end of file diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java index bc5bddad..197e960f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java @@ -23,9 +23,9 @@ public class WriterSequence { public void writeOutputFiles(Path inDirectory,LocalDateTime executionDateTime, VtlBindings vtlBindings, Map modeInputsMap, Map metadataModels, List errors, Statement database) throws KraftwerkException { - Path outDirectory = FileUtils.transformToOut(inDirectory,executionDateTime); + Path outDirectory = FileUtilsInterface.transformToOut(inDirectory,executionDateTime); - writeCsvFiles(outDirectory, vtlBindings, modeInputsMap, metadataModels, errors, null, database); + writeOutputFiles(inDirectory, executionDateTime,vtlBindings, modeInputsMap, metadataModels, errors, null, database); writeParquetFiles(outDirectory, vtlBindings, modeInputsMap, metadataModels, errors, database); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 46d2cd48..5d73e154 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -176,7 +176,7 @@ public void deleteDirectory(Path directoryPath) throws KraftwerkException { } /** - * List the files in the directory + * List the file names in the directory * @param dir * @return */ @@ -188,6 +188,14 @@ public List listFiles(String dir) { .toList(); } + @Override + public List listFilePaths(String dir) { + return Stream.of(new File(dir).listFiles()) + .filter(file -> !file.isDirectory()) + .map(File::getAbsolutePath) + .toList(); + } + @Override public Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset) { createDirectoryIfNotExist(FileUtilsInterface.transformToTemp(userInputs.getInputDirectory())); @@ -236,11 +244,14 @@ public URL convertToUrl(String userField, Path inputDirectory) { @Override @Nullable public Boolean isDirectory(String path) { + File file = new File(path); + if(file.isDirectory()){ + return true; + } if(!Files.isRegularFile(Path.of(path))){ return null; } - File file = new File(path); - return file.isDirectory(); + return false; } @Override diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index d22ff658..857f755d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -44,6 +44,8 @@ private static Path transformToOther(Path inDirectory, String other) { List listFiles(String dir); + List listFilePaths(String dir); + Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset); Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index 6796eed8..eb65af93 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -144,6 +144,11 @@ public List listFiles(String dir) { } } + @Override + public List listFilePaths(String dir) { + return listFiles(dir); + } + @Override public Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset) { return FileUtilsInterface.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); @@ -177,7 +182,22 @@ public URL convertToUrl(String userField, Path inputDirectory) { @Override public Boolean isDirectory(String path){ - return path.endsWith("/") || path.endsWith("\\"); + try { + //List files of parent to check if directory + Iterable> results = minioClient.listObjects( + ListObjectsArgs.builder().bucket(bucketName).prefix(Path.of(path).getParent().toString()).recursive(true).build()); + + for (Result result : results) { + if(result.get().objectName().equals(Path.of(path).getFileName().toString())){ + return result.get().isDir(); + } + } + log.warn("S3 File or folder {} not found in {}", Path.of(path).getFileName().toString(), Path.of(path).getParent().toString()); + return null; + } catch (Exception e) { + log.error(e.toString()); + return null; + } } @Override diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java index b7b3813e..16b4b5f4 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java @@ -5,6 +5,8 @@ import static org.junit.jupiter.api.Assertions.assertTrue; import java.io.File; +import java.io.IOException; +import java.nio.file.Files; import java.nio.file.Path; import java.nio.file.Paths; import java.sql.Connection; @@ -21,7 +23,6 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.Variable; import fr.insee.kraftwerk.core.metadata.VariableType; -import fr.insee.kraftwerk.core.utils.FileUtils; import fr.insee.kraftwerk.core.utils.SqlUtils; import org.junit.jupiter.api.AfterAll; import org.junit.jupiter.api.Assertions; @@ -91,8 +92,8 @@ void testGetDatasetOutputNames() { @Test @Order(3) - void testWriteCsv() throws KraftwerkException, SQLException { - FileUtils.createDirectoryIfNotExist(outputFiles.getOutputFolder()); + void testWriteCsv() throws KraftwerkException, IOException { + Files.createDirectories(outputFiles.getOutputFolder()); Map metaModels = new HashMap<>(); MetadataModel metMod = new MetadataModel(); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java index 97b06993..6840d859 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java @@ -11,7 +11,6 @@ import fr.insee.kraftwerk.core.outputs.parquet.ParquetOutputFiles; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; -import fr.insee.kraftwerk.core.utils.FileUtils; import fr.insee.kraftwerk.core.utils.SqlUtils; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java index 268dca57..fc606c17 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java @@ -5,6 +5,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.UserInputsFile; import fr.insee.kraftwerk.core.metadata.VariableType; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.InMemoryDataset; @@ -38,7 +39,8 @@ void convertVTLBindingTest() throws SQLException, KraftwerkException { //Given UserInputsFile testUserInputsFile = new UserInputsFile( Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "user_inputs/inputs_valid_several_modes.json"), - Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "user_inputs")); + Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "user_inputs"), + new FileSystemImpl()); VtlBindings vtlBindings = new VtlBindings(); Dataset testDataset = new InMemoryDataset(List.of(), List.of(new Structured.Component("TestString", String.class, Dataset.Role.IDENTIFIER))); diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java index 79cc453b..f2be95d1 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java @@ -10,6 +10,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.exceptions.NullException; import fr.insee.kraftwerk.core.inputs.UserInputsFile; import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.MetadataUtils; @@ -17,10 +18,8 @@ import fr.insee.kraftwerk.core.outputs.OutputFiles; import fr.insee.kraftwerk.core.outputs.csv.CsvOutputFiles; import fr.insee.kraftwerk.core.sequence.*; -import fr.insee.kraftwerk.core.utils.CsvUtils; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; -import fr.insee.kraftwerk.core.utils.FileUtils; import fr.insee.kraftwerk.core.utils.SqlUtils; import fr.insee.kraftwerk.core.vtl.VtlBindings; import io.cucumber.java.AfterAll; @@ -110,13 +109,13 @@ public void init_VTL_script(String vtlScriptName, String variableToCreate, Strin @When("Step 1 : We initialize the input files") public void initialize_input_files() throws KraftwerkException { System.out.println("InDirectory value : " + inDirectory); - userInputsFile = controlInputSequence.getUserInputs(inDirectory, new FileSystemImpl()); + userInputs = controlInputSequence.getUserInputs(inDirectory, new FileSystemImpl()); vtlBindings = new VtlBindings(); } @When("Step 1 : We initialize with input file {string}") public void initialize_with_specific_input(String inputFileName) throws KraftwerkException { - userInputsFile = new UserInputsFile(inDirectory.resolve(inputFileName), inDirectory, new FileSystemImpl()); + userInputs = new UserInputsFile(inDirectory.resolve(inputFileName), inDirectory, new FileSystemImpl()); vtlBindings = new VtlBindings(); } From cde44aa513a21aeeb0575481dda04a6b4cd8b6f1 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 21 Jun 2024 15:38:21 +0200 Subject: [PATCH 18/46] Changed file system I/O to use FileUtilsInterface --- .../kraftwerk/api/batch/KraftwerkBatch.java | 2 +- .../kraftwerk/api/process/MainProcessing.java | 17 +- .../api/process/MainProcessingGenesis.java | 12 +- .../api/services/KraftwerkService.java | 24 +- .../kraftwerk/api/services/MainService.java | 6 +- .../api/services/SplitterService.java | 8 + .../api/services/StepByStepService.java | 32 +-- .../fr/insee/kraftwerk/core/Constants.java | 15 +- .../dataprocessing/CalculatedProcessing.java | 5 +- .../dataprocessing/CleanUpProcessing.java | 5 +- .../core/dataprocessing/DataProcessing.java | 11 +- .../dataprocessing/DataProcessingManager.java | 9 +- .../core/dataprocessing/GroupProcessing.java | 5 +- .../InformationLevelsProcessing.java | 5 +- .../dataprocessing/LunaticDataProcessing.java | 5 +- .../MultimodeTransformations.java | 5 +- .../dataprocessing/PaperDataProcessing.java | 5 +- .../ReconciliationProcessing.java | 9 +- .../TCMSequencesProcessing.java | 7 +- .../UnimodalDataProcessing.java | 5 +- .../dataprocessing/XformsDataProcessing.java | 5 +- .../extradata/paradata/ParadataParser.java | 46 ++-- .../reportingdata/CSVReportingDataParser.java | 34 ++- .../reportingdata/ReportingDataParser.java | 9 +- .../reportingdata/XMLReportingDataParser.java | 13 +- .../core/inputs/UserInputsGenesis.java | 15 +- .../kraftwerk/core/metadata/DDIReader.java | 26 +- .../core/metadata/MetadataUtils.java | 9 +- .../core/metadata/MetadataUtilsGenesis.java | 9 +- .../kraftwerk/core/outputs/OutputFiles.java | 5 +- .../core/outputs/csv/CsvOutputFiles.java | 15 +- .../outputs/parquet/ParquetOutputFiles.java | 19 +- .../kraftwerk/core/parsers/DataParser.java | 80 +++---- .../core/parsers/DataParserManager.java | 11 +- .../core/parsers/LunaticJsonDataParser.java | 10 +- .../core/parsers/LunaticXmlDataParser.java | 7 +- .../core/parsers/PaperDataParser.java | 61 +++-- .../core/parsers/XformsDataParser.java | 7 +- .../core/sequence/BuildBindingsSequence.java | 15 +- .../BuildBindingsSequenceGenesis.java | 18 +- .../core/sequence/ControlInputSequence.java | 7 +- .../sequence/ControlInputSequenceGenesis.java | 9 +- .../core/sequence/MultimodalSequence.java | 16 +- .../core/sequence/UnimodalSequence.java | 18 +- .../sequence/VtlReaderWriterSequence.java | 7 +- .../core/sequence/WriterSequence.java | 29 ++- .../insee/kraftwerk/core/utils/CsvUtils.java | 14 +- .../kraftwerk/core/utils/TextFileReader.java | 18 +- .../kraftwerk/core/utils/TextFileWriter.java | 34 +-- .../kraftwerk/core/utils/XMLSplitter.java | 1 + .../kraftwerk/core/utils/XmlFileReader.java | 16 +- .../core/utils/files/FileSystemImpl.java | 224 ++++++++++-------- .../core/utils/files/FileUtilsInterface.java | 21 ++ .../kraftwerk/core/utils/files/MinioImpl.java | 124 +++++----- .../insee/kraftwerk/core/vtl/VtlExecute.java | 9 +- .../unit_tests/AggregateDefinitions.java | 9 +- .../unit_tests/EvalScriptDefinitions.java | 3 +- .../unit_tests/ExportDatasetDefinitions.java | 5 +- .../CalculatedProcessingTest.java | 7 +- .../dataprocessing/CleanUpProcessingTest.java | 6 +- .../dataprocessing/GroupProcessingTest.java | 6 +- .../dataprocessing/InformationLevelsTest.java | 8 +- .../PaperDataProcessingTest.java | 6 +- .../dataprocessing/ReconciliationTest.java | 9 +- .../TCMSequenceProcessingTest.java | 6 +- .../extradata/CSVReportingDataParserTest.java | 10 +- .../core/extradata/ParaDataParserTest.java | 3 +- .../extradata/XMLReportingDataParserTest.java | 12 +- .../core/metadata/DDIReaderTest.java | 12 +- .../kraftwerk/core/metadata/VariableTest.java | 11 +- .../core/outputs/CsvOutputFilesTest.java | 2 +- .../core/outputs/ParquetOutputFilesTest.java | 2 +- .../outputs/scripts/ImportScriptTest.java | 9 +- .../parsers/LunaticXmlDataParserTest.java | 13 +- .../core/parsers/PaperDataParserTest.java | 9 +- .../sequence/BuildBindingsSequenceTest.java | 4 +- .../core/utils/xsl/SaxonTransformerTest.java | 10 +- .../kraftwerk/core/vtl/VtlBindingsTest.java | 6 +- .../core/vtl/VtlJsonDatasetWriterTest.java | 7 +- .../CalculatedProcessingDefinition.java | 9 +- .../DDIGetterDefinitions.java | 3 +- .../functional_tests/MainDefinitions.java | 10 +- .../functional_tests/ParadataDefinitions.java | 8 +- .../VariablesGetterDefinitions.java | 3 +- 84 files changed, 778 insertions(+), 583 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index b0864677..58fba5e8 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -73,7 +73,7 @@ public void run(String... args) throws Exception{ //Archive if(Boolean.TRUE.equals(archiveAtEnd)){ - KraftwerkService kraftwerkService = new KraftwerkService(); + KraftwerkService kraftwerkService = new KraftwerkService(minioConfig); kraftwerkService.archive(inDirectory, new MinioImpl(minioClient, minioConfig.getBucketName())); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java index b3768ccb..a2fda208 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java @@ -46,7 +46,7 @@ public class MainProcessing { private KraftwerkExecutionLog kraftwerkExecutionLog; private final List errors = new ArrayList<>(); private LocalDateTime executionDateTime; - private FileUtilsInterface fileUtilsInterface; + private final FileUtilsInterface fileUtilsInterface; /** @@ -64,7 +64,7 @@ public MainProcessing(String inDirectoryParam, boolean fileByFile,boolean withAl this.withAllReportingData = withAllReportingData; this.withDDI=withDDI; this.limitSize = limitSize; - controlInputSequence = new ControlInputSequence(defaultDirectory); + controlInputSequence = new ControlInputSequence(defaultDirectory, fileUtilsInterface); this.fileUtilsInterface = fileUtilsInterface; } @@ -75,7 +75,7 @@ public MainProcessing(String inDirectoryParam, boolean fileByFile, String defaul this.withAllReportingData = !fileByFile; this.withDDI=true; this.limitSize = limitSize; - controlInputSequence = new ControlInputSequence(defaultDirectory); + controlInputSequence = new ControlInputSequence(defaultDirectory, fileUtilsInterface); this.fileUtilsInterface = fileUtilsInterface; } @@ -117,7 +117,7 @@ public void init() throws KraftwerkException { userInputsFile = controlInputSequence.getUserInputs(inDirectory, fileUtilsInterface); - metadataModels = withDDI ? MetadataUtils.getMetadata(userInputsFile.getModeInputsMap()) : MetadataUtils.getMetadataFromLunatic(userInputsFile.getModeInputsMap()); + metadataModels = withDDI ? MetadataUtils.getMetadata(userInputsFile.getModeInputsMap(), fileUtilsInterface) : MetadataUtils.getMetadataFromLunatic(userInputsFile.getModeInputsMap()); userInputsFileList = getUserInputsFile(userInputsFile, fileByFile); @@ -138,7 +138,7 @@ public void init() throws KraftwerkException { /* Step 2 : unimodal data */ private void unimodalProcess() throws KraftwerkException { - BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(withAllReportingData); + BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(withAllReportingData, fileUtilsInterface); for (String dataMode : userInputsFile.getModeInputsMap().keySet()) { MetadataModel metadataForMode = metadataModels.get(dataMode); buildBindingsSequence.buildVtlBindings(userInputsFile, dataMode, vtlBindings, metadataForMode, withDDI, kraftwerkExecutionLog); @@ -156,17 +156,17 @@ private void multimodalProcess(Statement database){ /* Step 4 : Write output files */ private void outputFileWriter(Statement database) throws KraftwerkException { WriterSequence writerSequence = new WriterSequence(); - writerSequence.writeOutputFiles(inDirectory, executionDateTime, vtlBindings, userInputsFile.getModeInputsMap(), metadataModels, errors, database); + writerSequence.writeOutputFiles(inDirectory, executionDateTime, vtlBindings, userInputsFile.getModeInputsMap(), metadataModels, errors, database, fileUtilsInterface); } /* Step 5 : Write errors */ private void writeErrors() { - TextFileWriter.writeErrorsFile(inDirectory, executionDateTime, errors); + TextFileWriter.writeErrorsFile(inDirectory, executionDateTime, errors, fileUtilsInterface); } /* Step 6 : Write log */ - private void writeLog() {TextFileWriter.writeLogFile(inDirectory, executionDateTime, kraftwerkExecutionLog);} + private void writeLog() {TextFileWriter.writeLogFile(inDirectory, executionDateTime, kraftwerkExecutionLog, fileUtilsInterface);} private static List getUserInputsFile(UserInputsFile source, boolean fileByFile) throws KraftwerkException { List userInputsFileList = new ArrayList<>(); @@ -199,7 +199,6 @@ private static List getUserInputsFile(UserInputsFile source, boo return userInputsFileList; } - //TODO FIX HERE private static List getFilesToProcess(UserInputsFile userInputsFile, String dataMode) { List files = new ArrayList<>(); ModeInputs modeInputs = userInputsFile.getModeInputs(dataMode); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java index 1b979b79..99b60723 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java @@ -46,7 +46,7 @@ public class MainProcessingGenesis { @Getter private UserInputsGenesis userInputs; private LocalDateTime executionDateTime; - private FileUtilsInterface fileUtilsInterface; + private final FileUtilsInterface fileUtilsInterface; private Statement database; /* SPECIFIC VARIABLES */ @@ -73,7 +73,7 @@ public void init(String idCampaign) throws KraftwerkException, IOException { //We build userInputs for the given questionnaire userInputs = new UserInputsGenesis(controlInputSequenceGenesis.isHasConfigFile(), inDirectory, client.getModes(idCampaign), fileUtilsInterface); if (!userInputs.getModes().isEmpty()) { - metadataModels = MetadataUtilsGenesis.getMetadata(userInputs.getModeInputsMap()); + metadataModels = MetadataUtilsGenesis.getMetadata(userInputs.getModeInputsMap(), fileUtilsInterface); } else { log.error("No source found for campaign " + idCampaign); } @@ -110,9 +110,9 @@ public void runMain(String idCampaign) throws KraftwerkException, IOException { } private void unimodalProcess(List suLatest) throws KraftwerkException { - BuildBindingsSequenceGenesis buildBindingsSequenceGenesis = new BuildBindingsSequenceGenesis(); + BuildBindingsSequenceGenesis buildBindingsSequenceGenesis = new BuildBindingsSequenceGenesis(fileUtilsInterface); for (String dataMode : userInputs.getModeInputsMap().keySet()) { - buildBindingsSequenceGenesis.buildVtlBindings(dataMode, vtlBindings, metadataModels, suLatest, inDirectory, database, fileUtilsInterface); + buildBindingsSequenceGenesis.buildVtlBindings(dataMode, vtlBindings, metadataModels, suLatest, inDirectory, database); UnimodalSequence unimodal = new UnimodalSequence(); unimodal.applyUnimodalSequence(userInputs, dataMode, vtlBindings, errors, metadataModels, fileUtilsInterface); } @@ -127,12 +127,12 @@ private void multimodalProcess() { /* Step 4 : Write output files */ private void outputFileWriter() throws KraftwerkException { WriterSequence writerSequence = new WriterSequence(); - writerSequence.writeOutputFiles(inDirectory, executionDateTime, vtlBindings, userInputs.getModeInputsMap(), metadataModels, errors, database); + writerSequence.writeOutputFiles(inDirectory, executionDateTime, vtlBindings, userInputs.getModeInputsMap(), metadataModels, errors, database, fileUtilsInterface); } /* Step 5 : Write errors */ private void writeErrors() { - TextFileWriter.writeErrorsFile(inDirectory, executionDateTime, errors); + TextFileWriter.writeErrorsFile(inDirectory, executionDateTime, errors, fileUtilsInterface); } } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java index 1b05c0c6..dd1a39b6 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java @@ -1,14 +1,19 @@ package fr.insee.kraftwerk.api.services; +import fr.insee.kraftwerk.api.configuration.MinioConfig; import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.sequence.ControlInputSequence; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.MinioImpl; +import io.minio.MinioClient; import io.swagger.v3.oas.annotations.responses.ApiResponse; import io.swagger.v3.oas.annotations.responses.ApiResponses; import jakarta.annotation.PostConstruct; import org.apache.commons.lang3.StringUtils; +import org.springframework.beans.factory.annotation.Autowired; import org.springframework.beans.factory.annotation.Value; import org.springframework.http.ResponseEntity; import org.springframework.web.bind.annotation.RestController; @@ -37,16 +42,29 @@ public class KraftwerkService { @Value("${fr.insee.postcollecte.size-limit}") protected long limitSize; + MinioConfig minioConfig; + + protected ControlInputSequence controlInputSequence ; + + @Autowired + public KraftwerkService(MinioConfig minioConfig){ + this.minioConfig = minioConfig; + } @PostConstruct public void initializeWithProperties() { - - + FileUtilsInterface fileUtilsInterface; + if(minioConfig.isEnable()){ + MinioClient minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); + fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + }else{ + fileUtilsInterface = new FileSystemImpl(); + } if (StringUtils.isNotEmpty(csvOutputsQuoteChar)) { Constants.setCsvOutputQuoteChar(csvOutputsQuoteChar.trim().charAt(0)); } - controlInputSequence = new ControlInputSequence(defaultDirectory); + controlInputSequence = new ControlInputSequence(defaultDirectory, fileUtilsInterface); } public ResponseEntity archive(String inDirectoryParam, FileUtilsInterface fileUtilsInterface) { diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java index e8a1ddf1..78b2a8ea 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java @@ -30,12 +30,12 @@ public class MainService extends KraftwerkService { ConfigProperties configProperties; - MinioConfig minioConfig; MinioClient minioClient; @Autowired public MainService(ConfigProperties configProperties, MinioConfig minioConfig) { - this.configProperties = configProperties; + super(minioConfig); + this.configProperties = configProperties; this.minioConfig = minioConfig; if(minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); @@ -141,7 +141,7 @@ public ResponseEntity mainGenesis( MainProcessingGenesis mpGenesis = new MainProcessingGenesis(configProperties, fileUtilsInterface); try { - mpGenesis.setControlInputSequenceGenesis(new ControlInputSequenceGenesis(defaultDirectory)); + mpGenesis.setControlInputSequenceGenesis(new ControlInputSequenceGenesis(defaultDirectory, fileUtilsInterface)); mpGenesis.runMain(idCampaign); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java index 7a0c93f0..d0055789 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java @@ -1,9 +1,11 @@ package fr.insee.kraftwerk.api.services; +import fr.insee.kraftwerk.api.configuration.MinioConfig; import fr.insee.kraftwerk.core.utils.XMLSplitter; import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.tags.Tag; import lombok.extern.log4j.Log4j2; +import org.springframework.beans.factory.annotation.Autowired; import org.springframework.http.HttpStatus; import org.springframework.http.ResponseEntity; import org.springframework.web.bind.annotation.PutMapping; @@ -15,6 +17,12 @@ @Log4j2 public class SplitterService extends KraftwerkService{ //TODO add MinIO support + + @Autowired + public SplitterService(MinioConfig minioConfig) { + super(minioConfig); + } + @Operation(summary = "Split a XML file into smaller ones") @PutMapping(path = "/split/lunatic-xml") public ResponseEntity saveResponsesFromXmlFile(@RequestParam("inputFolder") String inputFolder, diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java index c6e07fae..39fa9c98 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java @@ -38,12 +38,12 @@ @RestController @Tag(name = "${tag.stepbystep}") public class StepByStepService extends KraftwerkService { - MinioConfig minioConfig; MinioClient minioClient; @Autowired public StepByStepService(MinioConfig minioConfig) { - this.minioConfig = minioConfig; + super(minioConfig); + //TODO warn if enable null if(minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); } @@ -73,8 +73,8 @@ public ResponseEntity buildVtlBindings( } //Process - BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(withAllReportingData); - VtlReaderWriterSequence vtlWriterSequence = new VtlReaderWriterSequence(); + BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(withAllReportingData, fileUtilsInterface); + VtlReaderWriterSequence vtlWriterSequence = new VtlReaderWriterSequence(fileUtilsInterface); for (String dataMode : mp.getUserInputsFile().getModeInputsMap().keySet()) { try{ @@ -117,14 +117,14 @@ public ResponseEntity buildVtlBindingsByDataMode( } //Process - BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(withAllReportingData); + BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(withAllReportingData, fileUtilsInterface); try{ buildBindingsSequence.buildVtlBindings(mp.getUserInputsFile(), dataMode, mp.getVtlBindings(), mp.getMetadataModels().get(dataMode), withDDI, null); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } - VtlReaderWriterSequence vtlWriterSequence = new VtlReaderWriterSequence(); + VtlReaderWriterSequence vtlWriterSequence = new VtlReaderWriterSequence(fileUtilsInterface); vtlWriterSequence.writeTempBindings(mp.getInDirectory(), dataMode, mp.getVtlBindings(), StepEnum.BUILD_BINDINGS); return ResponseEntity.ok(inDirectoryParam+ " - "+dataMode); @@ -162,19 +162,19 @@ public ResponseEntity unimodalProcessing( VtlBindings vtlBindings = new VtlBindings(); List errors = new ArrayList<>(); - VtlReaderWriterSequence vtlReaderSequence = new VtlReaderWriterSequence(); + VtlReaderWriterSequence vtlReaderSequence = new VtlReaderWriterSequence(fileUtilsInterface); vtlReaderSequence.readDataset(FileUtilsInterface.transformToTemp(inDirectory).toString(),dataMode, StepEnum.BUILD_BINDINGS, vtlBindings); - Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap()); + Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap(), fileUtilsInterface); //Process UnimodalSequence unimodal = new UnimodalSequence(); unimodal.applyUnimodalSequence(userInputsFile, dataMode, vtlBindings, errors, metadataModelMap, fileUtilsInterface); //Write technical outputs - VtlReaderWriterSequence vtlWriterSequence = new VtlReaderWriterSequence(); + VtlReaderWriterSequence vtlWriterSequence = new VtlReaderWriterSequence(fileUtilsInterface); vtlWriterSequence.writeTempBindings(inDirectory, dataMode, vtlBindings, StepEnum.UNIMODAL_PROCESSING); - TextFileWriter.writeErrorsFile(inDirectory, LocalDateTime.now(), errors); + TextFileWriter.writeErrorsFile(inDirectory, LocalDateTime.now(), errors, fileUtilsInterface); return ResponseEntity.ok(inDirectoryParam+ " - "+dataMode); @@ -210,7 +210,7 @@ public ResponseEntity multimodalProcessing( List errors = new ArrayList<>(); - VtlReaderWriterSequence vtlReaderWriterSequence = new VtlReaderWriterSequence(); + VtlReaderWriterSequence vtlReaderWriterSequence = new VtlReaderWriterSequence(fileUtilsInterface); //Test VtlBindings vtlBindings = new VtlBindings(); @@ -218,7 +218,7 @@ public ResponseEntity multimodalProcessing( vtlReaderWriterSequence.readDataset(FileUtilsInterface.transformToTemp(inDirectory).toString(),dataMode, StepEnum.UNIMODAL_PROCESSING, vtlBindings); } - Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap()); + Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap(), fileUtilsInterface); //Process try(Connection database = SqlUtils.openConnection()) { @@ -232,7 +232,7 @@ public ResponseEntity multimodalProcessing( for (String datasetName : vtlBindings.getDatasetNames()) { vtlReaderWriterSequence.writeTempBindings(inDirectory, datasetName, vtlBindings, StepEnum.MULTIMODAL_PROCESSING); } - TextFileWriter.writeErrorsFile(inDirectory, LocalDateTime.now(), errors); + TextFileWriter.writeErrorsFile(inDirectory, LocalDateTime.now(), errors, fileUtilsInterface); return ResponseEntity.ok(inDirectoryParam); @@ -267,7 +267,7 @@ public ResponseEntity writeOutputFiles( for (String name : fileNames){ String pathBindings = path + File.separator + name; String bindingName = name.substring(0, name.indexOf("_"+StepEnum.MULTIMODAL_PROCESSING.getStepLabel())); - VtlReaderWriterSequence vtlReaderSequence = new VtlReaderWriterSequence(); + VtlReaderWriterSequence vtlReaderSequence = new VtlReaderWriterSequence(fileUtilsInterface); vtlReaderSequence.readDataset(pathBindings, bindingName, vtlBindings); } WriterSequence writerSequence = new WriterSequence(); @@ -277,9 +277,9 @@ public ResponseEntity writeOutputFiles( } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); } - Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap()); + Map metadataModelMap = MetadataUtils.getMetadata(userInputsFile.getModeInputsMap(), fileUtilsInterface); try (Statement database = SqlUtils.openConnection().createStatement()) { - writerSequence.writeOutputFiles(inDirectory, executionDateTime, vtlBindings, userInputsFile.getModeInputsMap(), metadataModelMap, errors, database); + writerSequence.writeOutputFiles(inDirectory, executionDateTime, vtlBindings, userInputsFile.getModeInputsMap(), metadataModelMap, errors, database, fileUtilsInterface); } return ResponseEntity.ok(inDirectoryParam); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/Constants.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/Constants.java index 10d9067d..ab3db1a3 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/Constants.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/Constants.java @@ -1,18 +1,20 @@ package fr.insee.kraftwerk.core; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.Getter; import lombok.extern.log4j.Log4j2; import org.json.simple.parser.JSONParser; import org.json.simple.parser.ParseException; import java.io.File; -import java.io.FileReader; import java.io.IOException; import java.io.InputStream; +import java.io.InputStreamReader; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; import java.net.URL; +import java.nio.charset.StandardCharsets; import java.nio.file.Path; import java.nio.file.Paths; import java.util.concurrent.TimeUnit; @@ -61,6 +63,8 @@ private Constants() {} public static final String DUCKDB_URL = "jdbc:duckdb:"; public static final int DB_CONNECTION_TRY_COUNT = 10; + public static final String DDI_FILE_REGEX = "ddi[\\w,\\s-]+\\.xml"; + public static final String LUNATIC_FILE_REGEX = "lunatic[\\w,\\s-]+\\.json"; // ----- Explicit Variables Names @@ -206,10 +210,11 @@ public static File getFileFromPath(String path) { * @throws ParseException * @throws IOException */ - public static Object readJsonSimple(Path filename) throws IOException, ParseException { - FileReader reader = new FileReader(filename.toString()); - JSONParser jsonParser = new JSONParser(); - return jsonParser.parse(reader); + public static Object readJsonSimple(Path filename, FileUtilsInterface fileUtilsInterface) throws IOException, ParseException { + try(InputStream inputStream = fileUtilsInterface.readFile(filename.toString())){ + JSONParser jsonParser = new JSONParser(); + return jsonParser.parse(new InputStreamReader(inputStream, StandardCharsets.UTF_8)); + } } // ---------- Maths function diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessing.java index 0eefff72..f6046afe 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessing.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.metadata.CalculatedVariables; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; import lombok.extern.log4j.Log4j2; @@ -18,8 +19,8 @@ public class CalculatedProcessing extends DataProcessing { public static final int MAXIMAL_RESOLVING_ITERATIONS = 100; private CalculatedVariables calculatedVariables; - public CalculatedProcessing(VtlBindings vtlBindings, CalculatedVariables calculatedVariables) { - super(vtlBindings); + public CalculatedProcessing(VtlBindings vtlBindings, CalculatedVariables calculatedVariables, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); this.calculatedVariables = calculatedVariables; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessing.java index bdb06e41..1317e6d7 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessing.java @@ -4,6 +4,7 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.PaperUcq; import fr.insee.kraftwerk.core.metadata.VariablesMap; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; import lombok.extern.log4j.Log4j2; @@ -24,8 +25,8 @@ public class CleanUpProcessing extends DataProcessing { private Map metadataModels; - public CleanUpProcessing(VtlBindings vtlBindings, Map metadataModels) { - super(vtlBindings); + public CleanUpProcessing(VtlBindings vtlBindings, Map metadataModels, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); this.metadataModels=metadataModels; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java index 35e5b28a..f5a60433 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.utils.TextFileReader; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -25,9 +26,12 @@ public abstract class DataProcessing { protected final VtlBindings vtlBindings; VtlExecute vtlExecute; - protected DataProcessing(VtlBindings vtlBindings){ + FileUtilsInterface fileUtilsInterface; + + protected DataProcessing(VtlBindings vtlBindings, FileUtilsInterface fileUtilsInterface){ this.vtlBindings = vtlBindings; - vtlExecute = new VtlExecute(); + vtlExecute = new VtlExecute(fileUtilsInterface); + this.fileUtilsInterface = fileUtilsInterface; } public abstract String getStepName(); @@ -65,7 +69,8 @@ protected String applyAutomatedVtlInstructions(String bindingName, List errors){ - String vtlScript = TextFileReader.readFromPath(userVtlInstructionsPath); + //TODO change to interface + String vtlScript = TextFileReader.readFromPath(userVtlInstructionsPath, fileUtilsInterface); log.info(String.format("User VTL instructions read for step %s:%n%s", getStepName(), vtlScript)); if (! (vtlScript == null || vtlScript.isEmpty() || vtlScript.contentEquals("")) ) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessingManager.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessingManager.java index c26c2ea6..a8257fe3 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessingManager.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessingManager.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.parsers.DataFormat; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.extern.log4j.Log4j2; @@ -22,17 +23,17 @@ private DataProcessingManager() { * * @return One of the concrete parsers. */ - public static UnimodalDataProcessing getProcessingClass(DataFormat dataFormat, VtlBindings vtlBindings, MetadataModel metadataModel) { + public static UnimodalDataProcessing getProcessingClass(DataFormat dataFormat, VtlBindings vtlBindings, MetadataModel metadataModel, FileUtilsInterface fileUtilsInterface) { UnimodalDataProcessing dataProcessing = null; switch (dataFormat) { case XFORMS: - dataProcessing = new XformsDataProcessing(vtlBindings, metadataModel); + dataProcessing = new XformsDataProcessing(vtlBindings, metadataModel, fileUtilsInterface); break; case PAPER: - dataProcessing = new PaperDataProcessing(vtlBindings, metadataModel); + dataProcessing = new PaperDataProcessing(vtlBindings, metadataModel, fileUtilsInterface); break; case LUNATIC_XML , LUNATIC_JSON: - dataProcessing = new LunaticDataProcessing(vtlBindings, metadataModel); + dataProcessing = new LunaticDataProcessing(vtlBindings, metadataModel, fileUtilsInterface); break; default: log.warn("Unknown data collection tool, null returned."); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessing.java index dcf054f3..cda4868c 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessing.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.VariablesMap; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -9,8 +10,8 @@ public class GroupProcessing extends DataProcessing{ private MetadataModel metadataModel; - public GroupProcessing(VtlBindings vtlBindings, MetadataModel metadataModel) { - super(vtlBindings); + public GroupProcessing(VtlBindings vtlBindings, MetadataModel metadataModel, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); this.metadataModel = metadataModel; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsProcessing.java index dfae189b..3848d713 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsProcessing.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.metadata.MetadataModel; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlMacros; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -15,8 +16,8 @@ */ public class InformationLevelsProcessing extends DataProcessing { - public InformationLevelsProcessing(VtlBindings vtlBindings) { - super(vtlBindings); + public InformationLevelsProcessing(VtlBindings vtlBindings, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); } @Override diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/LunaticDataProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/LunaticDataProcessing.java index b0126759..40d17c09 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/LunaticDataProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/LunaticDataProcessing.java @@ -1,6 +1,7 @@ package fr.insee.kraftwerk.core.dataprocessing; import fr.insee.kraftwerk.core.metadata.MetadataModel; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -9,8 +10,8 @@ */ public class LunaticDataProcessing extends UnimodalDataProcessing { - public LunaticDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel) { - super(vtlBindings, metadataModel); + public LunaticDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, metadataModel, fileUtilsInterface); } @Override diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/MultimodeTransformations.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/MultimodeTransformations.java index aee13db4..2eacbb62 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/MultimodeTransformations.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/MultimodeTransformations.java @@ -1,12 +1,13 @@ package fr.insee.kraftwerk.core.dataprocessing; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; public class MultimodeTransformations extends DataProcessing { - public MultimodeTransformations(VtlBindings vtlBindings) { - super(vtlBindings); + public MultimodeTransformations(VtlBindings vtlBindings, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); } @Override diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessing.java index 4f7606bc..1df415ef 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessing.java @@ -3,6 +3,7 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.UcqModality; import fr.insee.kraftwerk.core.metadata.UcqVariable; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -13,8 +14,8 @@ */ public class PaperDataProcessing extends UnimodalDataProcessing { - public PaperDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel) { - super(vtlBindings, metadataModel); + public PaperDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, metadataModel, fileUtilsInterface); } @Override diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationProcessing.java index 34f0e188..07a3fcfe 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationProcessing.java @@ -1,6 +1,7 @@ package fr.insee.kraftwerk.core.dataprocessing; import fr.insee.kraftwerk.core.Constants; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlMacros; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -17,14 +18,14 @@ public class ReconciliationProcessing extends DataProcessing { private final String modeVariableIdentifier; /** Return processing instance with default mode variable name. */ - public ReconciliationProcessing(VtlBindings vtlBindings) { - super(vtlBindings); + public ReconciliationProcessing(VtlBindings vtlBindings, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); this.modeVariableIdentifier = Constants.MODE_VARIABLE_NAME; } /** Return processing instance with mode variable name given. */ - public ReconciliationProcessing(VtlBindings vtlBindings, String modeVariableName) { - super(vtlBindings); + public ReconciliationProcessing(VtlBindings vtlBindings, String modeVariableName, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); this.modeVariableIdentifier = modeVariableName; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequencesProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequencesProcessing.java index a8b637f6..17839cd1 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequencesProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequencesProcessing.java @@ -3,6 +3,7 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.utils.TextFileReader; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; import lombok.extern.slf4j.Slf4j; @@ -16,8 +17,8 @@ public class TCMSequencesProcessing extends DataProcessing { private final String vtlDirectory; private final MetadataModel metadataModel; - public TCMSequencesProcessing(VtlBindings vtlBindings, MetadataModel metadataModel,String vtlDirectory) { - super(vtlBindings); + public TCMSequencesProcessing(VtlBindings vtlBindings, MetadataModel metadataModel, String vtlDirectory, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, fileUtilsInterface); this.metadataModel = metadataModel; this.vtlDirectory = vtlDirectory; } @@ -60,7 +61,7 @@ protected VtlScript generateVtlInstructions(String bindingName, MetadataModel me for(TCMModuleEnum tcmModuleEnum : tcmSequenceEnum.getTcmModules()){ Path tcmModulePath = Path.of(this.vtlDirectory).resolve("tcm").resolve(tcmModuleEnum.toString() + ".vtl"); if(tcmModulePath.toFile().exists()){ - vtlScriptBuilder.append(TextFileReader.readFromPath(tcmModulePath)); + vtlScriptBuilder.append(TextFileReader.readFromPath(tcmModulePath, fileUtilsInterface)); vtlScriptBuilder.append(System.lineSeparator()); log.info("TCM VTL instructions read for module " + tcmModuleEnum); }else{ diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/UnimodalDataProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/UnimodalDataProcessing.java index 1a891820..f20f0873 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/UnimodalDataProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/UnimodalDataProcessing.java @@ -1,6 +1,7 @@ package fr.insee.kraftwerk.core.dataprocessing; import fr.insee.kraftwerk.core.metadata.MetadataModel; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -11,8 +12,8 @@ public abstract class UnimodalDataProcessing extends DataProcessing { protected MetadataModel metadataModel; - protected UnimodalDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel){ - super(vtlBindings); + protected UnimodalDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel, FileUtilsInterface fileUtilsInterface){ + super(vtlBindings, fileUtilsInterface); this.metadataModel = metadataModel; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/XformsDataProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/XformsDataProcessing.java index b0c52bc9..81bb30ad 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/XformsDataProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/XformsDataProcessing.java @@ -1,6 +1,7 @@ package fr.insee.kraftwerk.core.dataprocessing; import fr.insee.kraftwerk.core.metadata.MetadataModel; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; @@ -9,8 +10,8 @@ */ public class XformsDataProcessing extends UnimodalDataProcessing { - public XformsDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel) { - super(vtlBindings, metadataModel); + public XformsDataProcessing(VtlBindings vtlBindings, MetadataModel metadataModel, FileUtilsInterface fileUtilsInterface) { + super(vtlBindings, metadataModel, fileUtilsInterface); } @Override diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java index 4238ebb9..3101e6f2 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/paradata/ParadataParser.java @@ -8,6 +8,7 @@ import fr.insee.kraftwerk.core.metadata.VariablesMap; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import org.json.simple.JSONArray; import org.json.simple.JSONObject; @@ -26,6 +27,12 @@ public class ParadataParser { private final List inputFields = Arrays.asList("RADIO", "CHECKBOX", "INPUT", "DATEPICKER"); + private final FileUtilsInterface fileUtilsInterface; + + public ParadataParser(FileUtilsInterface fileUtilsInterface) { + this.fileUtilsInterface = fileUtilsInterface; + } + public void parseParadata(Paradata paradata, SurveyRawData surveyRawData) throws NullException { log.info("Paradata parser being implemented for Survey Unit : {} !", @@ -35,32 +42,25 @@ public void parseParadata(Paradata paradata, SurveyRawData surveyRawData) throws throw new NullException("JSONFile not defined"); if (!filePath.toString().contentEquals("")) { -//TODO Change to interface + // Parse each ParaDataUE + List listParaDataUE = new ArrayList<>(); // Get all filepaths for each ParadataUE - try (Stream walk = Files.walk(filePath)) { - List listFilePaths = walk.filter(Files::isRegularFile) - .filter(file -> surveyRawData.getIdSurveyUnits().contains(getIdFromFilename(file))).toList(); - // Parse each ParaDataUE - List listParaDataUE = new ArrayList<>(); - - for (Path fileParaDataPath : listFilePaths) { - ParaDataUE paraDataUE = new ParaDataUE(); - paraDataUE.setFilepath(fileParaDataPath); - parseParadataUE(paraDataUE, surveyRawData); - paraDataUE.sortEvents(); - paraDataUE.setSurveyValidationDateTimeStamp(Constants.PARADATA_SURVEY_VALIDATION_EVENT_NAME); - if (paraDataUE.getEvents().size() > 2) { - paraDataUE.createOrchestratorsAndSessions(); - integrateParaDataVariablesIntoUE(paraDataUE, surveyRawData); - listParaDataUE.add(paraDataUE); - } + for(String fileParaDataPath : fileUtilsInterface.listFilePaths(filePath.toString()).stream().filter( + s -> surveyRawData.getIdSurveyUnits().contains(getIdFromFilename(Path.of(s))) + ).toList()){ + ParaDataUE paraDataUE = new ParaDataUE(); + paraDataUE.setFilepath(Path.of(fileParaDataPath)); + parseParadataUE(paraDataUE, surveyRawData); + paraDataUE.sortEvents(); + paraDataUE.setSurveyValidationDateTimeStamp(Constants.PARADATA_SURVEY_VALIDATION_EVENT_NAME); + if (paraDataUE.getEvents().size() > 2) { + paraDataUE.createOrchestratorsAndSessions(); + integrateParaDataVariablesIntoUE(paraDataUE, surveyRawData); + listParaDataUE.add(paraDataUE); } - paradata.setListParadataUE(listParaDataUE); - } catch (Exception e) { - log.error(e.getMessage()); } + paradata.setListParadataUE(listParaDataUE); } - } private String getIdFromFilename(Path file) { @@ -134,7 +134,7 @@ private JSONObject getParadataFromJson(ParaDataUE paradataUE) throws NullExcepti Path filePath = paradataUE.getFilepath(); JSONObject jsonObject; try { - jsonObject = (JSONObject) Constants.readJsonSimple(filePath); + jsonObject = (JSONObject) Constants.readJsonSimple(filePath, fileUtilsInterface); } catch (Exception e) { throw new NullException("Can't read JSON file - " + e.getClass() + " " + e.getMessage()); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/CSVReportingDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/CSVReportingDataParser.java index 57dadf8d..5da311e8 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/CSVReportingDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/CSVReportingDataParser.java @@ -1,8 +1,8 @@ package fr.insee.kraftwerk.core.extradata.reportingdata; -import java.io.FileNotFoundException; -import java.io.FileReader; import java.io.IOException; +import java.io.InputStream; +import java.io.InputStreamReader; import java.nio.file.Path; import java.text.ParseException; import java.text.SimpleDateFormat; @@ -18,6 +18,7 @@ import fr.insee.kraftwerk.core.exceptions.NullException; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; @Log4j2 @@ -25,15 +26,14 @@ public class CSVReportingDataParser extends ReportingDataParser { private CSVReader csvReader; + public CSVReportingDataParser(FileUtilsInterface fileUtilsInterface) { + super(fileUtilsInterface); + } + public void parseReportingData(ReportingData reportingData, SurveyRawData data, boolean withAllReportingData) throws NullException { Path filePath = reportingData.getFilepath(); - try{ - readFile(filePath); - } catch (NullPointerException e) { - throw new NullException(); - } - - try { + try(InputStream inputStream = fileUtilsInterface.readFile(filePath.toString())){ + readFile(inputStream); String[] header = this.csvReader.readNext(); if (controlHeader(header)) { String[] nextRecord; @@ -56,7 +56,7 @@ public void parseReportingData(ReportingData reportingData, SurveyRawData data, reportingDataUE.addState(state); reportingData.addReportingDataUE(reportingDataUE); } - integrateReportingDataIntoUE(data, reportingData, withAllReportingData); + integrateReportingDataIntoUE(data, reportingData, withAllReportingData, fileUtilsInterface); } else { log.error("Following CSV file is malformed : {}", filePath); } @@ -95,14 +95,10 @@ public boolean controlHeader(String[] header) { && header[6].contentEquals("adresse") && header[7].contentEquals("numeroDeLot")); } - private void readFile(Path filePath) { - try { - FileReader filereader = new FileReader(filePath.toString()); - this.csvReader = new CSVReader(filereader); - CSVParser parser = (new CSVParserBuilder()).withSeparator(',').build(); - this.csvReader = (new CSVReaderBuilder(filereader)).withCSVParser(parser).build(); - } catch (FileNotFoundException e) { - log.error("Unable to find the file {}, FileNotFoundException {}", filePath, e); - } + private void readFile(InputStream inputStream) { + InputStreamReader inputStreamReader = new InputStreamReader(inputStream); + this.csvReader = new CSVReader(inputStreamReader); + CSVParser parser = (new CSVParserBuilder()).withSeparator(',').build(); + this.csvReader = (new CSVReaderBuilder(inputStreamReader)).withCSVParser(parser).build(); } } \ No newline at end of file diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/ReportingDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/ReportingDataParser.java index 11047bb8..cd49960f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/ReportingDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/ReportingDataParser.java @@ -8,6 +8,7 @@ import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.utils.DateUtils; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import java.sql.Date; @@ -19,9 +20,15 @@ public abstract class ReportingDataParser { private int maxStates = 0; private int maxAttempts = 0; private int maxComments = 0; + protected FileUtilsInterface fileUtilsInterface; + + public ReportingDataParser(FileUtilsInterface fileUtilsInterface) { + this.fileUtilsInterface = fileUtilsInterface; + } protected void integrateReportingDataIntoUE(SurveyRawData surveyRawData, ReportingData reportingData, - boolean withAllReportingData) { + boolean withAllReportingData, FileUtilsInterface fileUtilsInterface) { + this.fileUtilsInterface = fileUtilsInterface; this.maxStates = countMaxStates(reportingData); this.maxAttempts = countMaxAttempts(reportingData); this.maxComments = countMaxComments(reportingData); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java index 0001b4b5..9051268f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java @@ -4,6 +4,7 @@ import fr.insee.kraftwerk.core.exceptions.NullException; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.utils.XmlFileReader; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import nu.xom.Document; import nu.xom.Element; @@ -17,8 +18,12 @@ public class XMLReportingDataParser extends ReportingDataParser { private Document document; - - public void parseReportingData(ReportingData reportingData, SurveyRawData data, boolean withAllReportingData) throws NullException { + + public XMLReportingDataParser(FileUtilsInterface fileUtilsInterface) { + super(fileUtilsInterface); + } + + public void parseReportingData(ReportingData reportingData, SurveyRawData data, boolean withAllReportingData) throws NullException { Path filePath = reportingData.getFilepath(); readFile(filePath); Element root; @@ -98,13 +103,13 @@ public void parseReportingData(ReportingData reportingData, SurveyRawData data, reportingData.addReportingDataUE(reportingDataUE); } - integrateReportingDataIntoUE(data, reportingData, withAllReportingData); + integrateReportingDataIntoUE(data, reportingData, withAllReportingData, fileUtilsInterface); this.document = null; } private void readFile(Path filePath) { - XmlFileReader xmlFileReader = new XmlFileReader(); + XmlFileReader xmlFileReader = new XmlFileReader(fileUtilsInterface); this.document = xmlFileReader.readXmlFile(filePath); if (this.document != null) { log.info("Successfully parsed Coleman/Moog answers file: " + filePath); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java index 6dace939..8994224d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java @@ -106,12 +106,8 @@ private String readField(JsonNode node, String field) throws MissingMandatoryFie * @return Path of the DDI file * @throws IOException – if an I/O error is thrown when accessing the starting file */ - public Path findDDIFile(Path specDirectory) throws KraftwerkException, IOException { - //TODO Change to interface - try (Stream files = Files.find(specDirectory, 1, (path, basicFileAttributes) -> path.toFile().getName().toLowerCase().matches("ddi[\\w,\\s-]+\\.xml"))) { - return files.findFirst() - .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + specDirectory.toString())); - } + public Path findDDIFile(Path specDirectory) throws KraftwerkException { + return Path.of(fileUtilsInterface.findFile(String.valueOf(specDirectory),Constants.DDI_FILE_REGEX)); } /** @@ -120,10 +116,7 @@ public Path findDDIFile(Path specDirectory) throws KraftwerkException, IOExcepti * @return Path of the Lunatic file * @throws IOException – if an I/O error is thrown when accessing the starting file */ - public Path findLunaticFile(Path specDirectory) throws KraftwerkException, IOException { - try (Stream files = Files.find(specDirectory, 1, (path, basicFileAttributes) -> path.toFile().getName().toLowerCase().matches("lunatic[\\w,\\s-]+\\.json"))) { - return files.findFirst() - .orElseThrow(() -> new KraftwerkException(404, "No Lunatic file (lunatic*.xml) found in " + specDirectory.toString())); - } + public Path findLunaticFile(Path specDirectory) throws KraftwerkException { + return Path.of(fileUtilsInterface.findFile(String.valueOf(specDirectory),Constants.LUNATIC_FILE_REGEX)); } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java index 9600f71c..897df7c3 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.xsl.SaxonTransformer; import lombok.extern.log4j.Log4j2; import org.apache.commons.lang3.StringUtils; @@ -17,6 +18,7 @@ import javax.xml.parsers.ParserConfigurationException; import java.io.File; import java.io.IOException; +import java.io.InputStream; import java.net.MalformedURLException; import java.net.URL; import java.nio.file.Files; @@ -43,7 +45,7 @@ private DDIReader() { * @return The variables found in the DDI. * @throws KraftwerkException */ - public static MetadataModel getMetadataFromDDI(URL ddiUrl) throws KraftwerkException { + public static MetadataModel getMetadataFromDDI(URL ddiUrl, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { try { // Path of the output 'variables.xml' temp file @@ -53,8 +55,7 @@ public static MetadataModel getMetadataFromDDI(URL ddiUrl) throws KraftwerkExcep transformDDI(ddiUrl, variablesTempFilePath); - MetadataModel metadataModel = readVariables(variablesTempFilePath); - //TODO change to use interface + MetadataModel metadataModel = readVariables(variablesTempFilePath, fileUtilsInterface); Files.delete(variablesFile.toPath()); return metadataModel; } @@ -93,12 +94,12 @@ private static void transformDDI(URL ddiUrl, Path variablesFilePath) { * @throws SAXException * @throws ParserConfigurationException */ - private static MetadataModel readVariables(Path variablesFilePath) + private static MetadataModel readVariables(Path variablesFilePath, FileUtilsInterface fileUtilsInterface) throws KraftwerkException, SAXException, IOException, ParserConfigurationException { MetadataModel metadataModel = new MetadataModel(); // Parse - Element root = readXmlFile(variablesFilePath); + Element root = readXmlFile(variablesFilePath, fileUtilsInterface); // Get XML groups NodeList groupElements = root.getChildNodes(); @@ -231,10 +232,8 @@ private static void addValues(UcqVariable variable, NodeList valueElements) { private static boolean nodeIsElementWithName(Node groupNode, String name) { return name.equals(groupNode.getNodeName()) && groupNode.getNodeType() == Node.ELEMENT_NODE; } - - private static Element readXmlFile(Path variablesFilePath) + private static Element readXmlFile(Path variablesFilePath, FileUtilsInterface fileUtilsInterface) throws ParserConfigurationException, SAXException, IOException, KraftwerkException { - File file = variablesFilePath.toFile(); System.setProperty("javax.xml.parsers.DocumentBuilderFactory", "com.sun.org.apache.xerces.internal.jaxp.DocumentBuilderFactoryImpl"); DocumentBuilderFactory factory = DocumentBuilderFactory.newInstance(); @@ -242,11 +241,12 @@ private static Element readXmlFile(Path variablesFilePath) factory.setAttribute(XMLConstants.ACCESS_EXTERNAL_DTD, ""); factory.setAttribute(XMLConstants.ACCESS_EXTERNAL_SCHEMA, ""); DocumentBuilder builder = factory.newDocumentBuilder(); - Document document = builder.parse(file); - if (document == null) - throw new KraftwerkException(500, "Can't read DDI - DDI is null"); - - return document.getDocumentElement(); + try(InputStream inputStream = fileUtilsInterface.readFile(variablesFilePath.toString())){ + Document document = builder.parse(inputStream); + if (document == null) + throw new KraftwerkException(500, "Can't read DDI - DDI is null"); + return document.getDocumentElement(); + } } private static String getFirstChildValue(Element variableElement, String childTagName) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java index 9def414a..09c0f8b5 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java @@ -3,6 +3,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.ModeInputs; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import java.util.LinkedHashMap; @@ -16,17 +17,17 @@ private MetadataUtils(){ throw new IllegalStateException("Utility class"); } - public static Map getMetadata(Map modeInputsMap){ + public static Map getMetadata(Map modeInputsMap, FileUtilsInterface fileUtilsInterface){ Map metadataModels = new LinkedHashMap<>(); - modeInputsMap.forEach((k, v) -> putToMetadataModels(k,v,metadataModels)); + modeInputsMap.forEach((k, v) -> putToMetadataModels(k,v,metadataModels, fileUtilsInterface)); return metadataModels; } - private static void putToMetadataModels(String dataMode, ModeInputs modeInputs, Map metadataModels ) { + private static void putToMetadataModels(String dataMode, ModeInputs modeInputs, Map metadataModels, FileUtilsInterface fileUtilsInterface) { // Step 1 : we add the variables read in the DDI MetadataModel metadataModel = new MetadataModel(); try { - metadataModel = DDIReader.getMetadataFromDDI(modeInputs.getDdiUrl()); + metadataModel = DDIReader.getMetadataFromDDI(modeInputs.getDdiUrl(), fileUtilsInterface); } catch (KraftwerkException e) { log.error(e.getMessage()); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java index 62f04f0e..e6be34bc 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java @@ -3,6 +3,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.ModeInputs; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import java.util.LinkedHashMap; @@ -16,19 +17,19 @@ private MetadataUtilsGenesis() { throw new IllegalStateException("Utility class"); } - public static Map getMetadata(Map modeInputsMap) throws KraftwerkException { + public static Map getMetadata(Map modeInputsMap, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { Map metadataModels = new LinkedHashMap<>(); for (Map.Entry entry : modeInputsMap.entrySet()) { String k = entry.getKey(); ModeInputs v = entry.getValue(); - putToMetadataVariable(k, v, metadataModels); + putToMetadataVariable(k, v, metadataModels, fileUtilsInterface); } return metadataModels; } - private static void putToMetadataVariable(String dataMode, ModeInputs modeInputsGenesis, Map metadataModels ) throws KraftwerkException { + private static void putToMetadataVariable(String dataMode, ModeInputs modeInputsGenesis, Map metadataModels, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { // Step 1 : we add the variables read in the DDI - MetadataModel metadataModel = DDIReader.getMetadataFromDDI(modeInputsGenesis.getDdiUrl()); + MetadataModel metadataModel = DDIReader.getMetadataFromDDI(modeInputsGenesis.getDdiUrl(), fileUtilsInterface); // Step 2 : we add the variables that are only present in the Lunatic file if (modeInputsGenesis.getLunaticFile() != null) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java index 55efe3bb..34097fd4 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java @@ -5,6 +5,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.Getter; import lombok.extern.slf4j.Slf4j; @@ -28,6 +29,7 @@ public abstract class OutputFiles { private final VtlBindings vtlBindings; private final Set datasetToCreate = new HashSet<>(); private final Statement database; + private final FileUtilsInterface fileUtilsInterface; /** * When an instance is created, the output folder is created. @@ -35,12 +37,13 @@ public abstract class OutputFiles { * @param outDirectory Out directory defined in application properties. * @param vtlBindings Vtl bindings where datasets are stored. */ - protected OutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement database) { + protected OutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement database, FileUtilsInterface fileUtilsInterface) { this.vtlBindings = vtlBindings; setOutputDatasetNames(modes); outputFolder = outDirectory; createOutputFolder(); this.database = database; + this.fileUtilsInterface = fileUtilsInterface; } /** Create output folder if doesn't exist. */ diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java index 75d97513..43837c12 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java @@ -9,6 +9,7 @@ import fr.insee.kraftwerk.core.outputs.TableScriptInfo; import fr.insee.kraftwerk.core.utils.SqlUtils; import fr.insee.kraftwerk.core.utils.TextFileWriter; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.log.KraftwerkExecutionLog; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.extern.slf4j.Slf4j; @@ -39,12 +40,12 @@ public class CsvOutputFiles extends OutputFiles { * @param outDirectory Out directory defined in application properties. * @param vtlBindings Vtl bindings where datasets are stored. */ - public CsvOutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement database) { - super(outDirectory, vtlBindings, modes, database); + public CsvOutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement database, FileUtilsInterface fileUtilsInterface) { + super(outDirectory, vtlBindings, modes, database, fileUtilsInterface); this.kraftwerkExecutionLog = null; } - public CsvOutputFiles(Path outDirectory, VtlBindings vtlBindings, KraftwerkExecutionLog kraftwerkExecutionLog, List modes, Statement database) { - super(outDirectory, vtlBindings, modes, database); + public CsvOutputFiles(Path outDirectory, VtlBindings vtlBindings, KraftwerkExecutionLog kraftwerkExecutionLog, List modes, Statement database, FileUtilsInterface fileUtilsInterface) { + super(outDirectory, vtlBindings, modes, database, fileUtilsInterface); this.kraftwerkExecutionLog = kraftwerkExecutionLog; } @@ -109,6 +110,8 @@ public void writeOutputTables(Map metadataModels) throws kraftwerkExecutionLog.getLineCountByTableMap().put(datasetName, countResult.getInt(1)); } } + + //TODO export to minio } catch (SQLException | IOException e) { throw new KraftwerkException(500, e.toString()); } @@ -170,9 +173,9 @@ public void writeImportScripts(Map metadataModels, List nbParquetFilesbyDataset = new HashMap<>(); + /** * When an instance is created, the output folder is created. - * + * * @param outDirectory Out directory defined in application properties. * @param vtlBindings Vtl bindings where datasets are stored. + * @param modes list of modes names + * @param databaseConnection connection to duckDb database + * @param fileUtilsInterface file interface to use (file system or minio) */ - - private Map nbParquetFilesbyDataset = new HashMap<>(); - - public ParquetOutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement databaseConnection) { - super(outDirectory, vtlBindings, modes, databaseConnection); + public ParquetOutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement databaseConnection, FileUtilsInterface fileUtilsInterface) { + super(outDirectory, vtlBindings, modes, databaseConnection, fileUtilsInterface); } @@ -53,6 +57,7 @@ public void writeOutputTables(Map metadataModels) throws Files.deleteIfExists(outputFile.toPath()); //Data export getDatabase().execute(String.format("COPY %s TO '%s' (FORMAT PARQUET)", datasetName, outputFile.getAbsolutePath())); + //TODO export to minio } catch (Exception e) { throw new KraftwerkException(500, e.toString()); @@ -75,7 +80,7 @@ public void writeImportScripts(Map metadataModels, List stream = Files.list(dataPath)){ - stream.forEach(t -> { - try { - parseDataFile(t); - if(kraftwerkExecutionLog != null) { - kraftwerkExecutionLog.getOkFileNames().add(t.getFileName().toString()); - } - } catch (NullException e) { - log.error("IOException occurred when trying to list data file: {} in folder {}", t, dataPath); + if(Boolean.TRUE.equals(fileUtilsInterface.isDirectory(dataPath.toString()))){ + for(String path : fileUtilsInterface.listFilePaths(String.valueOf(dataPath))){ + try { + parseDataFile(Path.of(path)); + if(kraftwerkExecutionLog != null) { + kraftwerkExecutionLog.getOkFileNames().add(Path.of(path).getFileName().toString()); } - }); - } catch (IOException e) { - log.error(String.format("IOException occurred when trying to list data files of folder: %s", dataPath)); + } catch (NullException e) { + log.error("IOException occurred when trying to list data file: {} in folder {}", path, dataPath); + } } } - - else { - log.warn(String.format("Data path given could not be identified as a file or folder: %s", dataPath)); - log.warn("No data was parsed."); - } - } /** @@ -84,35 +77,28 @@ public final void parseSurveyDataWithoutDDI(Path dataPath, Path lunaticFile, Kra log.error(DATAPATH_IS_NULL); throw new NullException(DATAPATH_IS_NULL); } - if (Files.isRegularFile(dataPath)) { + if(fileUtilsInterface.isDirectory(dataPath.toString()) == null){ + log.warn(String.format("Data path given could not be identified as a file or folder: %s", dataPath)); + log.warn("No data was parsed."); + } + if(Boolean.FALSE.equals(fileUtilsInterface.isDirectory(dataPath.toString()))) { parseDataFileWithoutDDI(dataPath,lunaticFile); if(kraftwerkExecutionLog != null) { kraftwerkExecutionLog.getOkFileNames().add(dataPath.getFileName().toString()); } } - - else if (Files.isDirectory(dataPath)) { - try (Stream stream = Files.list(dataPath)){ - stream.forEach(t -> { - try { - parseDataFileWithoutDDI(t,lunaticFile); - if(kraftwerkExecutionLog != null) { - kraftwerkExecutionLog.getOkFileNames().add(t.getFileName().toString()); - } - } catch (NullException e) { - log.error("IOException occurred when trying to list data file: {} in folder {}", t, dataPath); + if(Boolean.TRUE.equals(fileUtilsInterface.isDirectory(dataPath.toString()))) { + for(String path : fileUtilsInterface.listFilePaths(dataPath.toString())){ + try { + parseDataFileWithoutDDI(Path.of(path),lunaticFile); + if(kraftwerkExecutionLog != null) { + kraftwerkExecutionLog.getOkFileNames().add(Path.of(path).getFileName().toString()); } - }); - } catch (IOException e) { - log.error(String.format("IOException occurred when trying to list data files of folder: %s", dataPath)); + } catch (NullException e) { + log.error("IOException occurred when trying to list data file: {} in folder {}", path, dataPath); + } } } - - else { - log.warn(String.format("Data path given could not be identified as a file or folder: %s", dataPath)); - log.warn("No data was parsed."); - } - } /** diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParserManager.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParserManager.java index 59036010..e0a43222 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParserManager.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParserManager.java @@ -1,6 +1,7 @@ package fr.insee.kraftwerk.core.parsers; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; /** @@ -22,12 +23,12 @@ private DataParserManager(){ * @return * One of the concrete parsers. */ - public static DataParser getParser(DataFormat dataFormat, SurveyRawData data) { + public static DataParser getParser(DataFormat dataFormat, SurveyRawData data, FileUtilsInterface fileUtilsInterface) { return switch (dataFormat) { - case XFORMS -> new XformsDataParser(data); - case PAPER -> new PaperDataParser(data); - case LUNATIC_XML -> new LunaticXmlDataParser(data); - case LUNATIC_JSON -> new LunaticJsonDataParser(data); + case XFORMS -> new XformsDataParser(data, fileUtilsInterface); + case PAPER -> new PaperDataParser(data, fileUtilsInterface); + case LUNATIC_XML -> new LunaticXmlDataParser(data, fileUtilsInterface); + case LUNATIC_JSON -> new LunaticJsonDataParser(data,fileUtilsInterface); default -> { log.debug(String.format("Unknown data format: %s", dataFormat)); throw new IllegalArgumentException(String.format("Unknown data format: %s", dataFormat)); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticJsonDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticJsonDataParser.java index 2b1162e6..0403623c 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticJsonDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticJsonDataParser.java @@ -5,6 +5,7 @@ import fr.insee.kraftwerk.core.rawdata.GroupInstance; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import org.json.simple.JSONObject; @@ -18,8 +19,8 @@ public class LunaticJsonDataParser extends DataParser { * @param data The SurveyRawData to be filled by the parseSurveyData method. * The variables must have been previously set. */ - public LunaticJsonDataParser(SurveyRawData data) { - super(data); + public LunaticJsonDataParser(SurveyRawData data, FileUtilsInterface fileUtilsInterface) { + super(data,fileUtilsInterface); } @Override @@ -27,9 +28,10 @@ void parseDataFile(Path filePath) throws NullException { log.warn("Lunatic data parser being implemented!"); // - JSONObject jsonObject = null; + JSONObject jsonObject; + try { - jsonObject = (JSONObject) Constants.readJsonSimple(filePath); + jsonObject = (JSONObject) Constants.readJsonSimple(filePath, fileUtilsInterface); } catch (Exception e) { throw new NullException("Can't read JSON file - "+e.getClass()+" "+ e.getMessage()); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java index 7c6564fa..17d83365 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java @@ -7,6 +7,7 @@ import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.utils.XmlFileReader; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import nu.xom.Document; import nu.xom.Element; @@ -33,8 +34,8 @@ public class LunaticXmlDataParser extends DataParser { * @param data The SurveyRawData to be filled by the parseSurveyData method. The * variables must have been previously set. */ - public LunaticXmlDataParser(SurveyRawData data) { - super(data); + public LunaticXmlDataParser(SurveyRawData data, FileUtilsInterface fileUtilsInterface) { + super(data, fileUtilsInterface); } /** @@ -44,7 +45,7 @@ public LunaticXmlDataParser(SurveyRawData data) { * @return The parsed document. */ private Document readXmlFile(Path filePath) { - XmlFileReader xmlFileReader = new XmlFileReader(); + XmlFileReader xmlFileReader = new XmlFileReader(fileUtilsInterface); Document document = xmlFileReader.readXmlFile(filePath); if (document == null) { log.warn("Failed to parse Lunatic answers file: " + filePath); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/PaperDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/PaperDataParser.java index 21047f43..c421b017 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/PaperDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/PaperDataParser.java @@ -13,11 +13,12 @@ import fr.insee.kraftwerk.core.rawdata.GroupInstance; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; -import java.io.FileNotFoundException; -import java.io.FileReader; import java.io.IOException; +import java.io.InputStream; +import java.io.InputStreamReader; import java.nio.file.Path; import java.util.Arrays; import java.util.HashMap; @@ -32,8 +33,8 @@ @Log4j2 public class PaperDataParser extends DataParser { - /** File reader */ - private FileReader filereader; + /** Input stream reader */ + private InputStreamReader inputStreamReader; /** Csv reader */ private CSVReader csvReader; @@ -43,45 +44,38 @@ public class PaperDataParser extends DataParser { * @param data The SurveyRawData to be filled by the parseSurveyData method. The * variables must have been previously set. */ - public PaperDataParser(SurveyRawData data) { - super(data); + public PaperDataParser(SurveyRawData data, FileUtilsInterface fileUtilsInterface) { + super(data, fileUtilsInterface); } /** * Instantiate a CSVReader. * - * @param filePath Path to the CSV file. + * @param inputStream stream to the CSV file. */ - private void readCsvFile(Path filePath) { - try { - // Create an object of file reader - // class with CSV file as a parameter. - filereader = new FileReader(filePath.toString()); - // create csvReader object passing - // file reader as a parameter - csvReader = new CSVReader(filereader); - - // create csvParser object with - // custom separator semicolon - CSVParser parser = new CSVParserBuilder().withSeparator(Constants.CSV_PAPER_DATA_SEPARATOR).build(); - - // create csvReader object with parameter - // file reader and parser - csvReader = new CSVReaderBuilder(filereader) - // .withSkipLines(1) // (uncomment to ignore header) - .withCSVParser(parser).build(); - - } catch (FileNotFoundException e) { - log.error(String.format("Unable to find the file %s", filePath), e); - } + private void readCsvFileStream(InputStream inputStream) { + // Create an object of file reader + // class with CSV file as a parameter. + inputStreamReader = new InputStreamReader(inputStream); + // create csvReader object passing + // file reader as a parameter + csvReader = new CSVReader(inputStreamReader); + + // create csvParser object with + // custom separator semicolon + CSVParser parser = new CSVParserBuilder().withSeparator(Constants.CSV_PAPER_DATA_SEPARATOR).build(); + + // create csvReader object with parameter + // file reader and parser + csvReader = new CSVReaderBuilder(inputStreamReader) + // .withSkipLines(1) // (uncomment to ignore header) + .withCSVParser(parser).build(); } @Override void parseDataFile(Path filePath) { - - readCsvFile(filePath); - - try { + try(InputStream inputStream = fileUtilsInterface.readFile(filePath.toString())){ + readCsvFileStream(inputStream); /* * We first map the variables in the header (first line) of the CSV file to the @@ -161,7 +155,6 @@ void parseDataFile(Path filePath) { } data.addQuestionnaire(questionnaireData); } - filereader.close(); csvReader.close(); } catch (CsvValidationException e) { log.error(String.format("Following CSV file is malformed: %s", filePath), e); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java index af2d6b9f..89f8df35 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java @@ -5,6 +5,7 @@ import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.utils.XmlFileReader; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import nu.xom.Document; import nu.xom.Element; @@ -23,8 +24,8 @@ public class XformsDataParser extends DataParser { * @param data The SurveyRawData to be filled by the parseSurveyData method. * The variables must have been previously set. */ - public XformsDataParser(SurveyRawData data) { - super(data); + public XformsDataParser(SurveyRawData data, FileUtilsInterface fileUtilsInterface) { + super(data, fileUtilsInterface); } /** @@ -33,7 +34,7 @@ public XformsDataParser(SurveyRawData data) { * @return The parsed document. */ private Document readXmlFile(Path filePath) { - XmlFileReader xmlFileReader = new XmlFileReader(); + XmlFileReader xmlFileReader = new XmlFileReader(fileUtilsInterface); Document document = xmlFileReader.readXmlFile(filePath); if (document != null) { log.info("Successfully parsed Xforms answers file: " + filePath); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequence.java index aa6a6012..29a57d24 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequence.java @@ -13,6 +13,7 @@ import fr.insee.kraftwerk.core.parsers.DataParser; import fr.insee.kraftwerk.core.parsers.DataParserManager; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.log.KraftwerkExecutionLog; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; @@ -25,10 +26,12 @@ public class BuildBindingsSequence { VtlExecute vtlExecute; private final boolean withAllReportingData; + private final FileUtilsInterface fileUtilsInterface; - public BuildBindingsSequence(boolean withAllReportingData) { - vtlExecute = new VtlExecute(); + public BuildBindingsSequence(boolean withAllReportingData, FileUtilsInterface fileUtilsInterface) { + vtlExecute = new VtlExecute(fileUtilsInterface); this.withAllReportingData = withAllReportingData; + this.fileUtilsInterface = fileUtilsInterface; } public void buildVtlBindings(UserInputsFile userInputsFile, String dataMode, VtlBindings vtlBindings, MetadataModel metadataModel, boolean withDDI, KraftwerkExecutionLog kraftwerkExecutionLog) throws KraftwerkException { @@ -40,7 +43,7 @@ public void buildVtlBindings(UserInputsFile userInputsFile, String dataMode, Vtl /* Step 2.1 : Fill the data object with the survey answers file */ data.setDataFilePath(modeInputs.getDataFile()); - DataParser parser = DataParserManager.getParser(modeInputs.getDataFormat(), data); + DataParser parser = DataParserManager.getParser(modeInputs.getDataFormat(), data, fileUtilsInterface); log.info("Parsing survey data file " + modeInputs.getDataFile().getFileName()); if (withDDI) { parser.parseSurveyData(modeInputs.getDataFile(),kraftwerkExecutionLog); @@ -62,7 +65,7 @@ public void buildVtlBindings(UserInputsFile userInputsFile, String dataMode, Vtl private void parseParadata(ModeInputs modeInputs, SurveyRawData data) throws NullException { Path paraDataFolder = modeInputs.getParadataFolder(); if (paraDataFolder != null) { - ParadataParser paraDataParser = new ParadataParser(); + ParadataParser paraDataParser = new ParadataParser(fileUtilsInterface); Paradata paraData = new Paradata(paraDataFolder); paraDataParser.parseParadata(paraData, data); } @@ -73,11 +76,11 @@ private void parseReportingData(ModeInputs modeInputs, SurveyRawData data) throw if (reportingDataFile != null) { ReportingData reportingData = new ReportingData(reportingDataFile); if (reportingDataFile.toString().contains(".xml")) { - XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(); + XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(fileUtilsInterface); xMLReportingDataParser.parseReportingData(reportingData, data, withAllReportingData); } else if (reportingDataFile.toString().contains(".csv")) { - CSVReportingDataParser cSVReportingDataParser = new CSVReportingDataParser(); + CSVReportingDataParser cSVReportingDataParser = new CSVReportingDataParser(fileUtilsInterface); cSVReportingDataParser.parseReportingData(reportingData, data, withAllReportingData); } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java index 3f7db455..c931078a 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java @@ -29,12 +29,14 @@ public class BuildBindingsSequenceGenesis { VtlExecute vtlExecute; + FileUtilsInterface fileUtilsInterface; - public BuildBindingsSequenceGenesis() { - vtlExecute = new VtlExecute(); + public BuildBindingsSequenceGenesis(FileUtilsInterface fileUtilsInterface) { + vtlExecute = new VtlExecute(fileUtilsInterface); + this.fileUtilsInterface = fileUtilsInterface; } - public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map metadataModels, List surveyUnits, Path inDirectory, Statement database, FileUtilsInterface fileUtilsInterface) throws KraftwerkException, NullException { + public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map metadataModels, List surveyUnits, Path inDirectory, Statement database) throws KraftwerkException, NullException { SurveyRawData data = new SurveyRawData(); /* Step 2.0 : Read the DDI file (and Lunatic Json for missing variables) to get survey variables */ @@ -71,7 +73,7 @@ public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map modeInputsMap, Map metadataModels, List errors, Statement database) throws KraftwerkException { + public void writeOutputFiles(Path inDirectory, + LocalDateTime executionDateTime, + VtlBindings vtlBindings, + Map modeInputsMap, + Map metadataModels, + List errors, Statement database, + FileUtilsInterface fileUtilsInterface) throws KraftwerkException { Path outDirectory = FileUtilsInterface.transformToOut(inDirectory,executionDateTime); - writeOutputFiles(inDirectory, executionDateTime,vtlBindings, modeInputsMap, metadataModels, errors, null, database); - writeParquetFiles(outDirectory, vtlBindings, modeInputsMap, metadataModels, errors, database); + writeOutputFiles(inDirectory, executionDateTime,vtlBindings, modeInputsMap, metadataModels, errors, null, database, fileUtilsInterface); + writeParquetFiles(outDirectory, vtlBindings, modeInputsMap, metadataModels, errors, database, fileUtilsInterface); } - public void writeOutputFiles(Path inDirectory, LocalDateTime localDateTime, VtlBindings vtlBindings, Map modeInputsMap, Map metadataModels, List errors, KraftwerkExecutionLog kraftwerkExecutionLog, Statement databaseConnection) throws KraftwerkException { + public void writeOutputFiles(Path inDirectory, + LocalDateTime localDateTime, + VtlBindings vtlBindings, + Map modeInputsMap, + Map metadataModels, + List errors, + KraftwerkExecutionLog kraftwerkExecutionLog, + Statement databaseConnection, + FileUtilsInterface fileUtilsInterface) throws KraftwerkException { Path outDirectory = FileUtilsInterface.transformToOut(inDirectory,localDateTime); /* Step 4.1 : write csv output tables */ - OutputFiles csvOutputFiles = new CsvOutputFiles(outDirectory, vtlBindings, kraftwerkExecutionLog, new ArrayList<>(modeInputsMap.keySet()), databaseConnection); + OutputFiles csvOutputFiles = new CsvOutputFiles(outDirectory, vtlBindings, kraftwerkExecutionLog, new ArrayList<>(modeInputsMap.keySet()), databaseConnection, fileUtilsInterface); csvOutputFiles.writeOutputTables(metadataModels); -//TODO change to use interface /* Step 4.2 : write scripts to import csv tables in several languages */ csvOutputFiles.writeImportScripts(metadataModels, errors); } //Write Parquet - private void writeParquetFiles(Path outDirectory, VtlBindings vtlBindings, Map modeInputsMap, Map metadataModels, List errors, Statement databaseConnection) throws KraftwerkException { + private void writeParquetFiles(Path outDirectory, VtlBindings vtlBindings, Map modeInputsMap, Map metadataModels, List errors, Statement databaseConnection, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { /* Step 4.3 : write parquet output tables */ - OutputFiles parquetOutputFiles = new ParquetOutputFiles(outDirectory, vtlBindings, new ArrayList<>(modeInputsMap.keySet()), databaseConnection); + OutputFiles parquetOutputFiles = new ParquetOutputFiles(outDirectory, vtlBindings, new ArrayList<>(modeInputsMap.keySet()), databaseConnection, fileUtilsInterface); parquetOutputFiles.writeOutputTables(metadataModels); parquetOutputFiles.writeImportScripts(metadataModels, errors); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java index e04f1767..12e220de 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java @@ -1,10 +1,10 @@ package fr.insee.kraftwerk.core.utils; -import java.io.FileReader; import java.io.FileWriter; import java.io.IOException; +import java.io.InputStream; +import java.io.InputStreamReader; import java.nio.charset.StandardCharsets; -import java.nio.file.Path; import com.opencsv.CSVParser; import com.opencsv.CSVParserBuilder; @@ -17,28 +17,28 @@ /** Encapsulate org.opencsv features that we use in Kraftwerk. */ public class CsvUtils { - + //TODO make it work with Minio private CsvUtils() { //Utility class } - public static CSVReader getReader(Path filePath) throws IOException { + public static CSVReader getReader(InputStream inputStream){ CSVParser parser = new CSVParserBuilder() .withSeparator(Constants.CSV_OUTPUTS_SEPARATOR) //.withQuoteChar(Constants.CSV_OUTPUTS_QUOTE_CHAR) //.withEscapeChar(CSVWriter.DEFAULT_ESCAPE_CHARACTER) .build(); - return new CSVReaderBuilder(new FileReader(filePath.toFile(), StandardCharsets.UTF_8)) + return new CSVReaderBuilder(new InputStreamReader(inputStream, StandardCharsets.UTF_8)) //.withSkipLines(1) // (uncomment to ignore header) .withCSVParser(parser) .build(); } - public static CSVReader getReaderWithSeparator(String filePath, char separator) throws IOException { + public static CSVReader getReaderWithSeparator(InputStream inputStream, char separator){ CSVParser csvParser= new CSVParserBuilder() .withSeparator(separator) .build(); - return new CSVReaderBuilder(new FileReader(filePath, StandardCharsets.UTF_8)) + return new CSVReaderBuilder(new InputStreamReader(inputStream, StandardCharsets.UTF_8)) .withCSVParser(csvParser) .build(); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileReader.java index d177ba28..7cddcbd5 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileReader.java @@ -1,11 +1,13 @@ package fr.insee.kraftwerk.core.utils; import java.io.BufferedReader; -import java.io.FileReader; import java.io.IOException; +import java.io.InputStream; +import java.io.InputStreamReader; import java.io.Reader; import java.nio.file.Path; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; @Log4j2 @@ -26,10 +28,10 @@ private TextFileReader(){ * @return * The content of the file in a string. */ - public static String readFromPath(Path filePath){ - try { - FileReader fileReader = new FileReader(filePath.toFile()); - return readTextContent(fileReader); + public static String readFromPath(Path filePath, FileUtilsInterface fileUtilsInterface){ + try (InputStream inputStream = fileUtilsInterface.readFile(filePath.toString())){ + InputStreamReader inputStreamReader = new InputStreamReader(inputStream); + return readTextContent(inputStreamReader); } catch (IOException e) { log.warn(String.format("Unable to read the text file %s.", filePath), e); @@ -37,14 +39,14 @@ public static String readFromPath(Path filePath){ } } - public static String readTextContent(Reader fileReader) throws IOException { - BufferedReader br = new BufferedReader(fileReader); + public static String readTextContent(Reader inputStreamReader) throws IOException { + BufferedReader br = new BufferedReader(inputStreamReader); StringBuilder content = new StringBuilder(); String line; while ((line = br.readLine()) != null) { content.append(line); } - fileReader.close(); + inputStreamReader.close(); br.close(); return content.toString(); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java index 9f0f2f78..400317b0 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java @@ -1,6 +1,5 @@ package fr.insee.kraftwerk.core.utils; -import java.io.FileWriter; import java.io.IOException; import java.nio.file.Path; import java.time.LocalDateTime; @@ -29,44 +28,31 @@ private TextFileWriter() { * @param filePath Path to the file. * @param fileContent Content of the text file. */ - public static void writeFile(Path filePath, String fileContent){ - try (FileWriter myWriter = new FileWriter(filePath.toFile())){ - myWriter.write(fileContent); - log.info(String.format("Text file: %s successfully written", filePath)); - } catch (IOException e) { - log.warn(String.format("Error occurred when trying to write text file: %s", filePath), e); - } - } + public static void writeFile(Path filePath, String fileContent, FileUtilsInterface fileUtilsInterface){ + fileUtilsInterface.writeFile(String.valueOf(filePath), fileContent, true); + log.info(String.format("Text file: %s successfully written", filePath)); + } - public static void writeErrorsFile(Path inDirectory, LocalDateTime localDateTime, List errors) { + public static void writeErrorsFile(Path inDirectory, LocalDateTime localDateTime, List errors, FileUtilsInterface fileUtilsInterface) { Path tempOutputPath = FileUtilsInterface.transformToOut(inDirectory,localDateTime) .resolve(Constants.ERRORS_FILE_NAME); FileSystemImpl.createDirectoryIfNotExist(tempOutputPath.getParent()); //Write errors file if (!errors.isEmpty()) { - try (FileWriter myWriter = new FileWriter(tempOutputPath.toFile(),true)){ - for (KraftwerkError error : errors){ - myWriter.write(error.toString()); - } - log.info(String.format("Text file: %s successfully written", tempOutputPath)); - } catch (IOException e) { - log.warn(String.format("Error occurred when trying to write text file: %s", tempOutputPath), e); + for (KraftwerkError error : errors) { + fileUtilsInterface.writeFile(tempOutputPath.toString(), error.toString(), false); } + log.info(String.format("Text file: %s successfully written", tempOutputPath)); } else { log.debug("No error found during VTL transformations"); } } - public static void writeLogFile(Path inDirectory, LocalDateTime localDateTime, KraftwerkExecutionLog kraftwerkExecutionLog){ + public static void writeLogFile(Path inDirectory, LocalDateTime localDateTime, KraftwerkExecutionLog kraftwerkExecutionLog, FileUtilsInterface fileUtilsInterface){ Path tempOutputPath = FileUtilsInterface.transformToOut(inDirectory,localDateTime); tempOutputPath = tempOutputPath.resolve(inDirectory.getFileName() + "_LOG_" + kraftwerkExecutionLog.getStartTimeStamp() +".txt"); - FileSystemImpl.createDirectoryIfNotExist(tempOutputPath.getParent()); - try (FileWriter myWriter = new FileWriter(tempOutputPath.toFile(),true)){ - myWriter.write(kraftwerkExecutionLog.getFormattedString()); - }catch (IOException e) { - log.warn(String.format("Error occurred when trying to write log file: %s", tempOutputPath), e); - } + fileUtilsInterface.writeFile(tempOutputPath.toString(), kraftwerkExecutionLog.getFormattedString(), false); } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java index 0ecb43db..f5507761 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java @@ -16,6 +16,7 @@ import java.util.List; public class XMLSplitter { + //TODO Make it work with MinIO // We use StAX in this class to deal with memory issues on huge XML files private XMLSplitter() { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XmlFileReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XmlFileReader.java index ff41b980..85e9d35f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XmlFileReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XmlFileReader.java @@ -1,9 +1,10 @@ package fr.insee.kraftwerk.core.utils; -import java.io.File; import java.io.IOException; +import java.io.InputStream; import java.nio.file.Path; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import nu.xom.Builder; import nu.xom.Document; @@ -18,12 +19,19 @@ public class XmlFileReader { private boolean xsdValidation = false; + private final FileUtilsInterface fileUtilsInterface; + + public XmlFileReader(FileUtilsInterface fileUtilsInterface) { + this.fileUtilsInterface = fileUtilsInterface; + } public Document readXmlFile(Path filePath) { - try { - File file = filePath.toFile(); + try (InputStream inputStream = fileUtilsInterface.readFile(filePath.toString())){ + if(inputStream == null){ + return null; + } Builder parser = new Builder(xsdValidation); - return parser.build(file); + return parser.build(inputStream); } catch (ValidityException ex) { log.warn("XSD validation error.", ex); log.warn("See following INFO log for details."); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 5d73e154..b4dadd40 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -11,7 +11,11 @@ import javax.annotation.Nullable; import java.io.File; +import java.io.FileNotFoundException; +import java.io.FileOutputStream; import java.io.IOException; +import java.io.InputStream; +import java.io.OutputStream; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; @@ -72,100 +76,6 @@ public void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkExc } } - /** - * If reporting data, we move reporting data files - * @param inputFolder - * @param campaignName - * @param modeInputs - * @throws KraftwerkException - */ - private void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs) - throws KraftwerkException { - if (modeInputs.getReportingDataFile() != null) { - moveDirectory(modeInputs.getReportingDataFile().toFile(), inputFolder.resolve(ARCHIVE) - .resolve(getRoot(modeInputs.getReportingDataFile(), campaignName)).toFile()); - } - } - - /** - * If paradata, we move the paradata folder - * @param inputFolder - * @param campaignName - * @param modeInputs - * @throws KraftwerkException - */ - private void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs) - throws KraftwerkException { - if (modeInputs.getParadataFolder() != null) { - moveDirectory(modeInputs.getParadataFolder().toFile(), inputFolder.resolve(ARCHIVE) - .resolve(getRoot(modeInputs.getParadataFolder(), campaignName)).toFile()); - } - } - - private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) - throws KraftwerkException { - Path dataPath = modeInputs.getDataFile(); - Path newDataPath = inputFolder.resolve(ARCHIVE).resolve(getRoot(dataPath, campaignName)); - - if (!Files.exists(newDataPath)) { - new File(newDataPath.getParent().toString()).mkdirs(); - } - if (Files.isRegularFile(dataPath)) { - moveFile(dataPath, newDataPath); - } else if (Files.isDirectory(dataPath)) { - moveDirectory(dataPath.toFile(),newDataPath.toFile()); - } else { - log.debug(String.format("No file or directory at path: %s", dataPath)); - } - } - - private void createArchiveDirectoryIfNotExists(Path inputFolder) { - if (!Files.exists(inputFolder.resolve(ARCHIVE))) { - inputFolder.resolve(ARCHIVE).toFile().mkdir(); - } - } - - private void moveFile(Path dataPath, Path newDataPath) throws KraftwerkException { - try { - Files.move(dataPath, newDataPath); - } catch (IOException e) { - throw new KraftwerkException(500, "Can't move file " + dataPath + " to " + newDataPath); - } - } - - - private void moveDirectory(File sourceFile, File destFile) throws KraftwerkException { - if (sourceFile.isDirectory()) { - File[] files = sourceFile.listFiles(); - assert files != null : "List of files in sourceFile is null"; - for (File file : files) - moveDirectory(file, new File(destFile, file.getName())); - try { - Files.delete(sourceFile.toPath()); - } catch (IOException e) { - throw new KraftwerkException(500, "Can't delete " + sourceFile + " - IOException : " + e.getMessage()); - } - } else { - if (!destFile.getParentFile().exists() && !destFile.getParentFile().mkdirs()) - throw new KraftwerkException(500, "Can't create directory to archive"); - if (!sourceFile.renameTo(destFile)) - throw new KraftwerkException(500, "Can't rename file " + sourceFile + " to " + destFile); - } - } - - private String getRoot(Path path, String campaignName) { - String[] directories = path.toString().split(Pattern.quote(File.separator)); - int campaignIndex = Arrays.asList(directories).indexOf(campaignName); - String[] newDirectories = Arrays.copyOfRange(directories, campaignIndex + 1, directories.length); - StringBuilder result = new StringBuilder(); - String sep = ""; - for (String directory : newDirectories) { - result.append(sep).append(directory); - sep = File.separator; - } - return result.toString(); - } - @Override public void deleteDirectory(Path directoryPath) throws KraftwerkException { try { @@ -262,11 +172,135 @@ public long getSizeOf(String path) { @Override public void writeFile(String path, String toWrite, boolean replace) { - StandardOpenOption standardOpenOption = replace ? StandardOpenOption.TRUNCATE_EXISTING : StandardOpenOption.APPEND; + StandardOpenOption standardOpenOption = replace || !isFileExists(path) ? StandardOpenOption.CREATE : StandardOpenOption.APPEND; try { Files.write(Path.of(path), toWrite.getBytes(), standardOpenOption); }catch (IOException e){ log.error(e.toString()); } } + + @Override + public String findFile(String directory, String regex) throws KraftwerkException { + try (Stream files = Files.find(Path.of(directory), 1, (path, basicFileAttributes) -> path.toFile().getName().toLowerCase().matches(regex))) { + return files.findFirst() + .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + directory)).toString(); + }catch (IOException e){ + log.error(e.toString()); + return null; + } + } + + @Override + public InputStream readFile(String path) { + try{ + return Files.newInputStream(Path.of(path)); + }catch (IOException e){ + log.error(e.toString()); + return null; + } + } + + @Override + public boolean isFileExists(String path) { + return Files.exists(Path.of(path)); + } + + + // Utilities + + /** + * If reporting data, we move reporting data files + * @param inputFolder + * @param campaignName + * @param modeInputs + * @throws KraftwerkException + */ + private void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs) + throws KraftwerkException { + if (modeInputs.getReportingDataFile() != null) { + moveDirectory(modeInputs.getReportingDataFile().toFile(), inputFolder.resolve(ARCHIVE) + .resolve(getRoot(modeInputs.getReportingDataFile(), campaignName)).toFile()); + } + } + + /** + * If paradata, we move the paradata folder + * @param inputFolder + * @param campaignName + * @param modeInputs + * @throws KraftwerkException + */ + private void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs) + throws KraftwerkException { + if (modeInputs.getParadataFolder() != null) { + moveDirectory(modeInputs.getParadataFolder().toFile(), inputFolder.resolve(ARCHIVE) + .resolve(getRoot(modeInputs.getParadataFolder(), campaignName)).toFile()); + } + } + + private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) + throws KraftwerkException { + Path dataPath = modeInputs.getDataFile(); + Path newDataPath = inputFolder.resolve(ARCHIVE).resolve(getRoot(dataPath, campaignName)); + + if (!Files.exists(newDataPath)) { + new File(newDataPath.getParent().toString()).mkdirs(); + } + if (Files.isRegularFile(dataPath)) { + moveFile(dataPath, newDataPath); + } else if (Files.isDirectory(dataPath)) { + moveDirectory(dataPath.toFile(),newDataPath.toFile()); + } else { + log.debug(String.format("No file or directory at path: %s", dataPath)); + } + } + + private void createArchiveDirectoryIfNotExists(Path inputFolder) { + if (!Files.exists(inputFolder.resolve(ARCHIVE))) { + inputFolder.resolve(ARCHIVE).toFile().mkdir(); + } + } + + private void moveFile(Path dataPath, Path newDataPath) throws KraftwerkException { + try { + Files.move(dataPath, newDataPath); + } catch (IOException e) { + throw new KraftwerkException(500, "Can't move file " + dataPath + " to " + newDataPath); + } + } + + + private void moveDirectory(File sourceFile, File destFile) throws KraftwerkException { + if (sourceFile.isDirectory()) { + File[] files = sourceFile.listFiles(); + assert files != null : "List of files in sourceFile is null"; + for (File file : files) + moveDirectory(file, new File(destFile, file.getName())); + try { + Files.delete(sourceFile.toPath()); + } catch (IOException e) { + throw new KraftwerkException(500, "Can't delete " + sourceFile + " - IOException : " + e.getMessage()); + } + } else { + if (!destFile.getParentFile().exists() && !destFile.getParentFile().mkdirs()) + throw new KraftwerkException(500, "Can't create directory to archive"); + if (!sourceFile.renameTo(destFile)) + throw new KraftwerkException(500, "Can't rename file " + sourceFile + " to " + destFile); + } + } + + private String getRoot(Path path, String campaignName) { + String[] directories = path.toString().split(Pattern.quote(File.separator)); + int campaignIndex = Arrays.asList(directories).indexOf(campaignName); + String[] newDirectories = Arrays.copyOfRange(directories, campaignIndex + 1, directories.length); + StringBuilder result = new StringBuilder(); + String sep = ""; + for (String directory : newDirectories) { + result.append(sep).append(directory); + sep = File.separator; + } + return result.toString(); + } + } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index 857f755d..a8291a8d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -6,6 +6,7 @@ import fr.insee.kraftwerk.core.inputs.UserInputsFile; import javax.annotation.Nullable; +import java.io.InputStream; import java.net.URL; import java.nio.file.Path; import java.time.LocalDateTime; @@ -13,6 +14,7 @@ import java.util.List; public interface FileUtilsInterface { + //TODO organize this static Path transformToOut(Path inDirectory) { return transformToOther(inDirectory, "out"); } @@ -42,6 +44,7 @@ private static Path transformToOther(Path inDirectory, String other) { void deleteDirectory(Path directoryPath) throws KraftwerkException; + //TODO change to listFilesNames List listFiles(String dir); List listFilePaths(String dir); @@ -67,5 +70,23 @@ private static Path transformToOther(Path inDirectory, String other) { */ long getSizeOf(String path); + /** + * Write a file in the path + * @param path path of the file + * @param toWrite String to write + * @param replace true if overwrite, false if append + */ void writeFile(String path, String toWrite, boolean replace); + + /** + * Find the file in the folder of a campaign + * @param directory directory where the file should be + * @param fileRegex regex of the file to match + * @return Path of the DDI file + * @throws KraftwerkException if no file found + */ + String findFile(String directory, String fileRegex) throws KraftwerkException; + InputStream readFile(String path); + + boolean isFileExists(String path); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index eb65af93..268708ec 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -23,6 +23,7 @@ import java.io.ByteArrayInputStream; import java.io.File; import java.io.InputStream; +import java.io.OutputStream; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; @@ -42,13 +43,14 @@ public class MinioImpl implements FileUtilsInterface { MinioClient minioClient; String bucketName; + // Interface methods @Override public void renameInputFile(Path inDirectory) { String file1MinioPathString = inDirectory.resolve("/kraftwerk.json").toString(); String fileWithTime = "kraftwerk-" + DateUtils.getCurrentTimeStamp() + ".json"; String file2MinioPathString = inDirectory.resolve(fileWithTime).toString(); - if (isObjectExist(file2MinioPathString)) { + if (isFileExists(file2MinioPathString)) { log.warn(String.format("Trying to rename '%s' to '%s', but second file already exists.", Path.of(file1MinioPathString).getFileName(), Path.of(file2MinioPathString).getFileName())); log.warn("Timestamped input file will be over-written."); deleteFile(file2MinioPathString); @@ -72,50 +74,6 @@ public void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkExc } } - private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) { - Path dataPath = modeInputs.getDataFile(); - Path newDataPath = inputFolder.resolve(ARCHIVE).resolve(getRoot(dataPath, campaignName)); - - if (!isDirectory(dataPath.toString())) { - moveFile(dataPath.toString(), newDataPath.toString()); - } else { - moveDirectory(dataPath.toString(), newDataPath.toString()); - } - } - - /** - * If paradata, we move the paradata folder - */ - private void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs){ - if (modeInputs.getParadataFolder() != null) { - moveDirectory(modeInputs.getParadataFolder().toString(), inputFolder.resolve(ARCHIVE) - .resolve(getRoot(modeInputs.getParadataFolder(), campaignName)).toString()); - } - } - - /** - * If reporting data, we move reporting data files - */ - private void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs){ - if (modeInputs.getReportingDataFile() != null) { - moveDirectory(modeInputs.getReportingDataFile().toString(), inputFolder.resolve(ARCHIVE) - .resolve(getRoot(modeInputs.getReportingDataFile(), campaignName)).toString()); - } - } - - private String getRoot(Path path, String campaignName) { - String[] directories = path.toString().split(Pattern.quote(File.separator)); - int campaignIndex = Arrays.asList(directories).indexOf(campaignName); - String[] newDirectories = Arrays.copyOfRange(directories, campaignIndex + 1, directories.length); - StringBuilder result = new StringBuilder(); - String sep = ""; - for (String directory : newDirectories) { - result.append(sep).append(directory); - sep = File.separator; - } - return result.toString(); - } - @Override public void deleteDirectory(Path directoryPath) throws KraftwerkException { try { @@ -217,10 +175,13 @@ public void writeFile(String path, String toWrite, boolean replace) { writeFileOnMinio(path, inputStream, toWrite.length()); } + @Override + public String findFile(String directory, String fileRegex) throws KraftwerkException { + return null; //TODO faire ça + } - //Utilities - - private InputStream readFile(String minioPath) { + @Override + public InputStream readFile(String minioPath) { try { return minioClient.getObject(GetObjectArgs.builder().bucket(bucketName).object(minioPath).build()); } catch (Exception e) { @@ -229,6 +190,21 @@ private InputStream readFile(String minioPath) { } } + @Override + public boolean isFileExists(String objectPath) { + try { + minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(objectPath).build()); + return true; + } catch (ErrorResponseException e) { + return false; + } catch (Exception e) { + log.error(e.toString()); + return false; + } + } + + //Utilities + private void writeFileOnMinio(String minioPath, InputStream inputStream, int fileSize) { try { minioClient.putObject(PutObjectArgs.builder().bucket(bucketName).stream(inputStream, fileSize, -1).object(minioPath).build()); @@ -280,15 +256,49 @@ private void deleteFile(String minioPath) { } } - private boolean isObjectExist(String objectPath) { - try { - minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(objectPath).build()); - return true; - } catch (ErrorResponseException e) { - return false; - } catch (Exception e) { - log.error(e.toString()); - return false; + + + private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) { + Path dataPath = modeInputs.getDataFile(); + Path newDataPath = inputFolder.resolve(ARCHIVE).resolve(getRoot(dataPath, campaignName)); + + if (!isDirectory(dataPath.toString())) { + moveFile(dataPath.toString(), newDataPath.toString()); + } else { + moveDirectory(dataPath.toString(), newDataPath.toString()); } } + + /** + * If paradata, we move the paradata folder + */ + private void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs){ + if (modeInputs.getParadataFolder() != null) { + moveDirectory(modeInputs.getParadataFolder().toString(), inputFolder.resolve(ARCHIVE) + .resolve(getRoot(modeInputs.getParadataFolder(), campaignName)).toString()); + } + } + + /** + * If reporting data, we move reporting data files + */ + private void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs){ + if (modeInputs.getReportingDataFile() != null) { + moveDirectory(modeInputs.getReportingDataFile().toString(), inputFolder.resolve(ARCHIVE) + .resolve(getRoot(modeInputs.getReportingDataFile(), campaignName)).toString()); + } + } + + private String getRoot(Path path, String campaignName) { + String[] directories = path.toString().split(Pattern.quote(File.separator)); + int campaignIndex = Arrays.asList(directories).indexOf(campaignName); + String[] newDirectories = Arrays.copyOfRange(directories, campaignIndex + 1, directories.length); + StringBuilder result = new StringBuilder(); + String sep = ""; + for (String directory : newDirectories) { + result.append(sep).append(directory); + sep = File.separator; + } + return result.toString(); + } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java index e24b8999..e32055f9 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java @@ -7,6 +7,7 @@ import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.TextFileWriter; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.vtl.jackson.TrevasModule; import fr.insee.vtl.model.Dataset; import lombok.extern.log4j.Log4j2; @@ -36,14 +37,16 @@ public class VtlExecute { private final ObjectMapper mapper; /** Engine that will execute VTL instructions */ private final ScriptEngine engine; + private final FileUtilsInterface fileUtilsInterface; - public VtlExecute(){ + public VtlExecute(FileUtilsInterface fileUtilsInterface){ mapper = new ObjectMapper(); mapper.registerModule(new TrevasModule()); // Engine engine = new ScriptEngineManager() .getEngineByName("vtl"); + this.fileUtilsInterface = fileUtilsInterface; } /** @@ -67,7 +70,7 @@ public void convertToVtlDataset(SurveyRawData surveyRawData, String bindingName, Path tempDataset = Paths.get(tempDatasetPath); try { - Files.delete(tempDataset); //TODO Change to use interface + Files.delete(tempDataset); log.debug("File {} deleted",tempDatasetPath); } catch (IOException e) { log.debug("Impossible to delete file {}",tempDatasetPath); @@ -123,7 +126,7 @@ public void writeJsonDataset(String bindingName, Path jsonOutFile, VtlBindings b //Write file if (bindings.containsKey(bindingName)) { try { - TextFileWriter.writeFile(jsonOutFile, mapper.writeValueAsString(bindings.getDataset(bindingName))); + TextFileWriter.writeFile(jsonOutFile, mapper.writeValueAsString(bindings.getDataset(bindingName)), fileUtilsInterface); } catch (JsonProcessingException e) { log.debug(String.format("Unable to serialize dataset stored under name '%s'.", bindingName), e); } diff --git a/kraftwerk-core/src/test/java/cucumber/unit_tests/AggregateDefinitions.java b/kraftwerk-core/src/test/java/cucumber/unit_tests/AggregateDefinitions.java index f7ea2db3..00ed2efb 100644 --- a/kraftwerk-core/src/test/java/cucumber/unit_tests/AggregateDefinitions.java +++ b/kraftwerk-core/src/test/java/cucumber/unit_tests/AggregateDefinitions.java @@ -7,6 +7,7 @@ import fr.insee.kraftwerk.core.dataprocessing.ReconciliationProcessing; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import io.cucumber.java.en.Given; @@ -25,7 +26,7 @@ public class AggregateDefinitions { public List errors = new ArrayList<>(); - VtlExecute vtlExecute = new VtlExecute(); + VtlExecute vtlExecute = new VtlExecute(new FileSystemImpl()); @Given("We have some VTLBindings named {string} and {string}") public void initialize(String firstDataset, String secondDataset){ @@ -35,9 +36,9 @@ public void initialize(String firstDataset, String secondDataset){ vtlExecute.convertToVtlDataset(fakeCawiData, firstDataset, vtlBindings); vtlExecute.convertToVtlDataset(fakePapiData, secondDataset, vtlBindings); // add group prefixes - GroupProcessing groupProcessing = new GroupProcessing(vtlBindings, fakeCawiData.getMetadataModel()); + GroupProcessing groupProcessing = new GroupProcessing(vtlBindings, fakeCawiData.getMetadataModel(), new FileSystemImpl()); groupProcessing.applyVtlTransformations(firstDataset, null,errors); - GroupProcessing groupProcessing2 = new GroupProcessing(vtlBindings, fakePapiData.getMetadataModel()); + GroupProcessing groupProcessing2 = new GroupProcessing(vtlBindings, fakePapiData.getMetadataModel(), new FileSystemImpl()); groupProcessing2.applyVtlTransformations(secondDataset, null,errors); // @@ -47,7 +48,7 @@ public void initialize(String firstDataset, String secondDataset){ @When("I try to aggregate the bindings") public void collect_variables() { - DataProcessing reconciliationProcessing = new ReconciliationProcessing(vtlBindings); + DataProcessing reconciliationProcessing = new ReconciliationProcessing(vtlBindings, new FileSystemImpl()); reconciliationProcessing.applyVtlTransformations( "MULTIMODE", null,errors); } diff --git a/kraftwerk-core/src/test/java/cucumber/unit_tests/EvalScriptDefinitions.java b/kraftwerk-core/src/test/java/cucumber/unit_tests/EvalScriptDefinitions.java index d80db367..02108eef 100644 --- a/kraftwerk-core/src/test/java/cucumber/unit_tests/EvalScriptDefinitions.java +++ b/kraftwerk-core/src/test/java/cucumber/unit_tests/EvalScriptDefinitions.java @@ -8,6 +8,7 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import io.cucumber.java.en.Given; @@ -18,7 +19,7 @@ public class EvalScriptDefinitions { public VtlBindings vtlBindings = new VtlBindings(); - VtlExecute vtlExecute = new VtlExecute(); + VtlExecute vtlExecute = new VtlExecute(new FileSystemImpl()); @Given("We have some simple VTLBindings") public void initialize() throws Exception { diff --git a/kraftwerk-core/src/test/java/cucumber/unit_tests/ExportDatasetDefinitions.java b/kraftwerk-core/src/test/java/cucumber/unit_tests/ExportDatasetDefinitions.java index 2ff6c225..7e4c9adc 100644 --- a/kraftwerk-core/src/test/java/cucumber/unit_tests/ExportDatasetDefinitions.java +++ b/kraftwerk-core/src/test/java/cucumber/unit_tests/ExportDatasetDefinitions.java @@ -4,6 +4,7 @@ import fr.insee.kraftwerk.core.dataprocessing.GroupProcessing; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import fr.insee.kraftwerk.core.vtl.VtlJsonDatasetWriter; @@ -22,7 +23,7 @@ public class ExportDatasetDefinitions { public String tempDatasetPath = ""; public SurveyRawData survey = null; - VtlExecute vtlExecute = new VtlExecute(); + VtlExecute vtlExecute = new VtlExecute(new FileSystemImpl()); @Given("We have some SurveyRawData named {string}") public void initialize(String nameDataset) throws Exception { @@ -44,7 +45,7 @@ public void exportDataset(String nameDataset) throws Exception { public void importDataset(String nameDataset) throws Exception { vtlExecute.putVtlDataset(tempDatasetPath, "OUTPUT_TEST_EXPORT", vtlBindings); // add group prefixes - GroupProcessing groupProcessing = new GroupProcessing(vtlBindings, survey.getMetadataModel()); + GroupProcessing groupProcessing = new GroupProcessing(vtlBindings, survey.getMetadataModel(), new FileSystemImpl()); groupProcessing.applyVtlTransformations("OUTPUT_TEST_EXPORT", null, new ArrayList<>()); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessingTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessingTest.java index d9eca49a..ba51b4c5 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessingTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CalculatedProcessingTest.java @@ -6,6 +6,8 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.Variable; import fr.insee.kraftwerk.core.metadata.VariableType; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlScript; import fr.insee.vtl.model.Dataset; @@ -27,6 +29,7 @@ class CalculatedProcessingTest { private static MetadataModel fooMetadataModel; private static VtlBindings vtlBindings; private static List errors; + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); @BeforeAll static void setFooCalculated() { @@ -52,7 +55,7 @@ static void setFooCalculated() { @Test void testIfCalculatedAreCorrectlyResolved() { // - CalculatedProcessing processing = new CalculatedProcessing(vtlBindings, fooCalculated); + CalculatedProcessing processing = new CalculatedProcessing(vtlBindings, fooCalculated, fileUtilsInterface); VtlScript vtlScript = processing.generateVtlInstructions("TEST"); // @@ -68,7 +71,7 @@ void testIfCalculatedAreProcessed() { // VtlBindings vtlBindings = getVtlBindings(); // - CalculatedProcessing processing = new CalculatedProcessing(vtlBindings, fooCalculated); + CalculatedProcessing processing = new CalculatedProcessing(vtlBindings, fooCalculated, fileUtilsInterface); processing.applyAutomatedVtlInstructions("TEST", errors); // Dataset outDataset = vtlBindings.getDataset("TEST"); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessingTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessingTest.java index d7887cf2..223b0728 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessingTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/CleanUpProcessingTest.java @@ -3,6 +3,8 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.metadata.*; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; @@ -17,6 +19,8 @@ class CleanUpProcessingTest { + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + Dataset cawiDataset = new InMemoryDataset( List.of( List.of("T01", "foo", "2"), @@ -95,7 +99,7 @@ void applyCleanUp() { vtlBindings.put("MULTIMODE", multimodeDataset); // Apply clean up - CleanUpProcessing cleanUpProcessing = new CleanUpProcessing(vtlBindings, metadatas); + CleanUpProcessing cleanUpProcessing = new CleanUpProcessing(vtlBindings, metadatas, fileUtilsInterface); cleanUpProcessing.applyVtlTransformations("MULTIMODE", null,errors); // Are paper indicator variables removed in VTL multimode dataset ? diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessingTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessingTest.java index 309c1d91..bc7a3eed 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessingTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/GroupProcessingTest.java @@ -2,6 +2,8 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.metadata.*; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.InMemoryDataset; @@ -16,6 +18,8 @@ class GroupProcessingTest { + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @Test void addPrefixes() { // @@ -41,7 +45,7 @@ void addPrefixes() { metadata.getVariables().putVariable(new Variable("FOO1", metadata.getGroup("DEPTH1"), VariableType.NUMBER)); metadata.getVariables().putVariable(new Variable("FOO2", metadata.getGroup("DEPTH2"), VariableType.NUMBER)); // - new GroupProcessing(vtlBindings, metadata).applyAutomatedVtlInstructions("TEST",errors); + new GroupProcessing(vtlBindings, metadata, fileUtilsInterface).applyAutomatedVtlInstructions("TEST",errors); Dataset outDataset = vtlBindings.getDataset("TEST"); // diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsTest.java index 661c848c..c347bbf8 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/InformationLevelsTest.java @@ -8,6 +8,8 @@ import java.util.Map; import java.util.Set; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import fr.insee.kraftwerk.core.Constants; @@ -18,7 +20,7 @@ import fr.insee.vtl.model.InMemoryDataset; class InformationLevelsTest { - + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); private final String rootId = Constants.ROOT_IDENTIFIER_NAME; Dataset testDataset = new InMemoryDataset( @@ -52,7 +54,7 @@ void applyInformationLevelsProcessing() { VtlBindings vtlBindings = new VtlBindings(); vtlBindings.put("MULTIMODE", testDataset); // - InformationLevelsProcessing processing = new InformationLevelsProcessing(vtlBindings); + InformationLevelsProcessing processing = new InformationLevelsProcessing(vtlBindings, fileUtilsInterface); processing.applyAutomatedVtlInstructions("MULTIMODE",errors); // Dataset rootDataset = vtlBindings.getDataset(Constants.ROOT_GROUP_NAME); @@ -92,7 +94,7 @@ void applyInformationLevelsProcessingWithPartialIdNUll() { VtlBindings vtlBindings = new VtlBindings(); vtlBindings.put("MULTIMODE", testDatasetWithPartialIdNull); // - InformationLevelsProcessing processing = new InformationLevelsProcessing(vtlBindings); + InformationLevelsProcessing processing = new InformationLevelsProcessing(vtlBindings, fileUtilsInterface); processing.applyAutomatedVtlInstructions("MULTIMODE",errors); // Dataset rootDataset = vtlBindings.getDataset(Constants.ROOT_GROUP_NAME); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessingTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessingTest.java index 936ec8a7..d118a392 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessingTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/PaperDataProcessingTest.java @@ -2,6 +2,8 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.metadata.*; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; @@ -16,7 +18,7 @@ import static org.junit.Assert.assertNotNull; class PaperDataProcessingTest { - + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); Dataset paperDataset = new InMemoryDataset( List.of( // Correct answers @@ -70,7 +72,7 @@ void testPaperDataProcessing() { VtlBindings vtlBindings = new VtlBindings(); vtlBindings.put("TEST", paperDataset); // - PaperDataProcessing paperDataProcessing = new PaperDataProcessing(vtlBindings, metadataModel); + PaperDataProcessing paperDataProcessing = new PaperDataProcessing(vtlBindings, metadataModel, fileUtilsInterface); paperDataProcessing.applyAutomatedVtlInstructions("TEST", errors); // Dataset paperDsModified = vtlBindings.getDataset("TEST"); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationTest.java index 1c45c0d2..58bf71c0 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/ReconciliationTest.java @@ -2,6 +2,8 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.KraftwerkError; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; @@ -23,6 +25,7 @@ class ReconciliationTest { private VtlBindings vtlBindings; private List errors; + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); InMemoryDataset capiDataset = new InMemoryDataset( List.of( @@ -80,7 +83,7 @@ void applyReconciliation_singleMode(String dsName) { // vtlBindings.put("SINGLE_MODE", testDatasets.get(dsName)); // - ReconciliationProcessing reconciliation = new ReconciliationProcessing(vtlBindings); + ReconciliationProcessing reconciliation = new ReconciliationProcessing(vtlBindings, fileUtilsInterface); reconciliation.applyVtlTransformations("MULTIMODE", null,errors); // Dataset multimodeDataset = vtlBindings.getDataset("MULTIMODE"); @@ -92,7 +95,7 @@ private Dataset applyReconciliation_twoModes(String mode1, String mode2) { vtlBindings.put(mode1, testDatasets.get(mode1)); vtlBindings.put(mode2, testDatasets.get(mode2)); // - ReconciliationProcessing reconciliation = new ReconciliationProcessing(vtlBindings); + ReconciliationProcessing reconciliation = new ReconciliationProcessing(vtlBindings, fileUtilsInterface); reconciliation.applyVtlTransformations("MULTIMODE", null,errors); // return vtlBindings.getDataset("MULTIMODE"); @@ -136,7 +139,7 @@ void applyReconciliation_threeModes() { vtlBindings.put("CAWI", capiDataset); vtlBindings.put("PAPI", papiDataset); // - ReconciliationProcessing reconciliation = new ReconciliationProcessing(vtlBindings); + ReconciliationProcessing reconciliation = new ReconciliationProcessing(vtlBindings, fileUtilsInterface); reconciliation.applyVtlTransformations("MULTIMODE", null,errors); // Dataset multimodeDataset = vtlBindings.getDataset("MULTIMODE"); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequenceProcessingTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequenceProcessingTest.java index 60196fad..9e40b6f4 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequenceProcessingTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/dataprocessing/TCMSequenceProcessingTest.java @@ -4,6 +4,8 @@ import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.metadata.Sequence; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.InMemoryDataset; @@ -26,6 +28,8 @@ class TCMSequenceProcessingTest { static final String FORMAT_INSTRUCTION = "/* Instruction %s */"; static final List modules = new ArrayList<>(); + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + //Given static Dataset unimodalDataset = new InMemoryDataset( List.of( @@ -77,7 +81,7 @@ void check_standard_vtl_execution(){ String expectedScript = expectedScriptBuilder.toString(); //WHEN - TCMSequencesProcessing processing = new TCMSequencesProcessing(vtlBindings, metadataModel, Path.of(TestConstants.UNIT_TESTS_DIRECTORY).resolve("vtl").toString()); + TCMSequencesProcessing processing = new TCMSequencesProcessing(vtlBindings, metadataModel, Path.of(TestConstants.UNIT_TESTS_DIRECTORY).resolve("vtl").toString(), fileUtilsInterface); String scriptString = processing.applyAutomatedVtlInstructions("TEST", errors); //THEN diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/CSVReportingDataParserTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/CSVReportingDataParserTest.java index 27d580e9..ec501205 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/CSVReportingDataParserTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/CSVReportingDataParserTest.java @@ -7,6 +7,8 @@ import fr.insee.kraftwerk.core.extradata.reportingdata.ReportingDataUE; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.Test; @@ -16,9 +18,11 @@ class CSVReportingDataParserTest { + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @Test void parseReportingDataTest() { - CSVReportingDataParser csvReportingDataParser = new CSVReportingDataParser(); + CSVReportingDataParser csvReportingDataParser = new CSVReportingDataParser(fileUtilsInterface); SurveyRawData data = SurveyRawDataTest.createFakePapiSurveyRawData(); ReportingData reportingData = new ReportingData( @@ -48,7 +52,7 @@ void parseReportingDataTest() { @Test void controlHeaderTest() { - CSVReportingDataParser csvReportingDataParser = new CSVReportingDataParser(); + CSVReportingDataParser csvReportingDataParser = new CSVReportingDataParser(fileUtilsInterface); String[] validHeaderToControl = new String [] {"statut", "dateInfo", "idUe", "idContact", "nom", "prenom", "adresse", "numeroDeLot"}; String[] invalidHeaderWrongValues = new String [] {"statut", "dateInfo", "idUe2", "idContact", "nom", "prenom", "adresse2", "numeroDeLot2"}; String[] headerToControlWrongSize = new String [] {"statut", "dateInfo", "idUe", "idContact", "nom", "prenom", "adresse", "numeroDeLot", "ninth"}; @@ -60,7 +64,7 @@ void controlHeaderTest() { @Test void convertDateTest() { - CSVReportingDataParser csvReportingDataParser = new CSVReportingDataParser(); + CSVReportingDataParser csvReportingDataParser = new CSVReportingDataParser(fileUtilsInterface); assertEquals(1645007098, csvReportingDataParser.convertToTimestamp("16/02/2022 11:24:58")); assertEquals(1566544132, csvReportingDataParser.convertToTimestamp("23/08/2019 09:08:52")); assertEquals(1111111111, csvReportingDataParser.convertToTimestamp("18/03/2005 02:58:31")); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/ParaDataParserTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/ParaDataParserTest.java index a78413a1..efbc56d1 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/ParaDataParserTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/ParaDataParserTest.java @@ -8,6 +8,7 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import org.junit.jupiter.api.Assertions; import org.junit.jupiter.api.Test; @@ -21,7 +22,7 @@ class ParaDataParserTest { - ParadataParser paradataParser = new ParadataParser(); + ParadataParser paradataParser = new ParadataParser(new FileSystemImpl()); @Test void catchExceptionAndErrors() { diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/XMLReportingDataParserTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/XMLReportingDataParserTest.java index 31211074..209419d4 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/XMLReportingDataParserTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/extradata/XMLReportingDataParserTest.java @@ -9,6 +9,8 @@ import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import java.nio.file.Paths; @@ -18,9 +20,11 @@ class XMLReportingDataParserTest { + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @Test void parseReportingDataTest() { - XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(); + XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(fileUtilsInterface); SurveyRawData data = SurveyRawDataTest.createFakePapiSurveyRawData(); ReportingData reportingData = new ReportingData( @@ -62,7 +66,7 @@ void parseReportingDataTest() { @Test void parseMoogReportingDataTest(){ - XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(); + XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(fileUtilsInterface); SurveyRawData data = SurveyRawDataTest.createFakePapiSurveyRawData(); ReportingData reportingData = new ReportingData( @@ -154,7 +158,7 @@ void parseMoogReportingDataTest(){ @Test void maxTest() { - XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(); + XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(fileUtilsInterface); ReportingData reportingData = new ReportingData(); reportingData.putReportingDataUE(ReportingDataUETest.createFakeReportingDataUEs()); assertEquals(5, xMLReportingDataParser.countMaxStates(reportingData)); //remove double @@ -162,7 +166,7 @@ void maxTest() { @Test void maxTest_noData() { - XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(); + XMLReportingDataParser xMLReportingDataParser = new XMLReportingDataParser(fileUtilsInterface); ReportingData reportingData = new ReportingData(); assertEquals(0, xMLReportingDataParser.countMaxStates(reportingData)); assertEquals(0, xMLReportingDataParser.countMaxAttempts(reportingData)); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java index dcb80462..70697ecc 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java @@ -3,6 +3,8 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import java.net.MalformedURLException; @@ -27,6 +29,8 @@ class DDIReaderTest { static final String DDI_LOG_X21 = "ddi-log-2021-x21-web.xml"; static final String DDI_LOG_X22 = "S2_WEB.xml"; + static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @Test void readSimpsonsV1Variables() throws MalformedURLException, KraftwerkException, URISyntaxException { @@ -41,7 +45,7 @@ void readSimpsonsV1Variables() throws MalformedURLException, KraftwerkException, "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V1)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V1), fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -79,7 +83,7 @@ void readSimpsonsV2Variables() throws MalformedURLException, KraftwerkException, "FEELCHAREV4", "LEAVDURATION11", "LEAVDURATION52", "NB_CHAR", "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V2)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V2), fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -107,7 +111,7 @@ void readVqsWebVariables() throws MalformedURLException, KraftwerkException, URI "RESIDM", "NHAB"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_WEB)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_WEB), fileUtilsInterface); // assertNotNull(vqsMetadata); @@ -147,7 +151,7 @@ void readVqsPapVariables() throws MalformedURLException, KraftwerkException, URI "AIDREG_B", "AIDREG_C", "AIDREG_D", "RESID", "RESIDANCIEN", "NBQUEST"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_PAP)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_PAP), fileUtilsInterface); // assertNotNull(vqsMetadata); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java index 37b9db3e..9288af0a 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java @@ -3,6 +3,8 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import java.net.MalformedURLException; @@ -19,6 +21,7 @@ class VariableTest { static final String DDI_SIMPSONS_V2 = "ddi-simpsons-v2.xml"; static final String DDI_VQS_WEB = "vqs-2021-x00-xforms-ddi.xml"; static final String DDI_VQS_PAP = "vqs-2021-x00-fo-ddi.xml"; + static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); @Test void readSimpsonsV1Variables() throws MalformedURLException, KraftwerkException, URISyntaxException { @@ -34,7 +37,7 @@ void readSimpsonsV1Variables() throws MalformedURLException, KraftwerkException, "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V1)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V1), fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -72,7 +75,7 @@ void readSimpsonsV2Variables() throws MalformedURLException, KraftwerkException, "FEELCHAREV4", "LEAVDURATION11", "LEAVDURATION52", "NB_CHAR", "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V2)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V2), fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -100,7 +103,7 @@ void readVqsWebVariables() throws MalformedURLException, KraftwerkException, URI "RESIDM", "NHAB"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_WEB)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_WEB), fileUtilsInterface); // assertNotNull(vqsMetadata); @@ -140,7 +143,7 @@ void readVqsPapVariables() throws MalformedURLException, KraftwerkException, URI "AIDREG_B", "AIDREG_C", "AIDREG_D", "RESID", "RESIDANCIEN", "NBQUEST"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_PAP)); + .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_PAP), fileUtilsInterface); // assertNotNull(vqsMetadata); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java index 16b4b5f4..27149885 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/CsvOutputFilesTest.java @@ -72,7 +72,7 @@ void createInstance() { // database = SqlUtils.openConnection(); SqlUtils.convertVtlBindingsIntoSqlDatabase(vtlBindings, database.createStatement()); - outputFiles = new CsvOutputFiles(Paths.get(TestConstants.UNIT_TESTS_DUMP), vtlBindings, testUserInputsFile.getModes(), database.createStatement()); + outputFiles = new CsvOutputFiles(Paths.get(TestConstants.UNIT_TESTS_DUMP), vtlBindings, testUserInputsFile.getModes(), database.createStatement(), fileUtilsInterface); }); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java index 6840d859..a4b9fd82 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java @@ -76,7 +76,7 @@ static void createInstance() throws SQLException { vtlBindings.put("FROM_USER", testDataset); // SqlUtils.convertVtlBindingsIntoSqlDatabase(vtlBindings, testDatabase); - outputFiles = new ParquetOutputFiles(Paths.get(TestConstants.UNIT_TESTS_DUMP), vtlBindings, testUserInputs.getModes(), testDatabase); + outputFiles = new ParquetOutputFiles(Paths.get(TestConstants.UNIT_TESTS_DUMP), vtlBindings, testUserInputs.getModes(), testDatabase, fileUtilsInterface); }); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/scripts/ImportScriptTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/scripts/ImportScriptTest.java index 5d9c2513..b3e48d64 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/scripts/ImportScriptTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/scripts/ImportScriptTest.java @@ -10,6 +10,8 @@ import fr.insee.kraftwerk.core.outputs.TableScriptInfo; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import fr.insee.vtl.model.Dataset; @@ -36,8 +38,9 @@ class ImportScriptTest { TableScriptInfo tableScriptInfo; Map metadata; + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); - VtlExecute vtlExecute = new VtlExecute(); + VtlExecute vtlExecute = new VtlExecute(fileUtilsInterface); @BeforeEach public void initMetadata() { @@ -57,9 +60,9 @@ private void instantiateMap() { // add group prefixes List errors = new ArrayList<>(); - GroupProcessing groupProcessing = new GroupProcessing(vtlBindings, srdWeb.getMetadataModel()); + GroupProcessing groupProcessing = new GroupProcessing(vtlBindings, srdWeb.getMetadataModel(), fileUtilsInterface); groupProcessing.applyVtlTransformations("CAWI", null, errors); - GroupProcessing groupProcessing2 = new GroupProcessing(vtlBindings, srdPaper.getMetadataModel()); + GroupProcessing groupProcessing2 = new GroupProcessing(vtlBindings, srdPaper.getMetadataModel(), fileUtilsInterface); groupProcessing2.applyVtlTransformations("PAPI", null, errors); dataStructure = vtlBindings.getDataset("CAWI").getDataStructure(); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParserTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParserTest.java index 9909320d..ae00e02b 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParserTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParserTest.java @@ -9,6 +9,8 @@ import fr.insee.kraftwerk.core.rawdata.GroupData; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import java.nio.file.Path; @@ -23,11 +25,12 @@ class LunaticXmlDataParserTest { private final String dataSamplesFolder = TestConstants.UNIT_TESTS_DIRECTORY + "/data"; + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); @Test void readXmlFile_null() { SurveyRawData data = new SurveyRawData("TEST"); - LunaticXmlDataParser parser = new LunaticXmlDataParser(data); + LunaticXmlDataParser parser = new LunaticXmlDataParser(data, fileUtilsInterface); assertThrows(NullPointerException.class,() ->parser.parseDataFile(null)); parser.parseDataFile(Path.of("notfound.xml")); @@ -43,7 +46,7 @@ void parseLunaticDataFolder() throws NullException { metadataModel.getVariables().putVariable(new Variable("FOO", metadataModel.getRootGroup(), VariableType.STRING)); data.setMetadataModel(metadataModel); Path dataPath = Paths.get(dataSamplesFolder + "/lunatic_xml/fake-multiple-files"); - LunaticXmlDataParser parser = new LunaticXmlDataParser(data); + LunaticXmlDataParser parser = new LunaticXmlDataParser(data, fileUtilsInterface); parser.parseSurveyData(dataPath,null); // @@ -63,7 +66,7 @@ void parseLunaticXml_rootOnly() throws NullException { SurveyRawData data = new SurveyRawData("TEST"); data.setMetadataModel(MetadataModelTest.createVariablesMap_rootOnly()); Path dataPath = Paths.get(dataSamplesFolder + "/lunatic_xml/fake-lunatic-data-root-only.xml"); - LunaticXmlDataParser parser = new LunaticXmlDataParser(data); + LunaticXmlDataParser parser = new LunaticXmlDataParser(data, fileUtilsInterface); parser.parseSurveyData(dataPath,null); // @@ -96,7 +99,7 @@ void parseLunaticXml_oneLevel() throws NullException { SurveyRawData data = new SurveyRawData("TEST"); data.setMetadataModel(MetadataModelTest.createVariablesMap_oneLevel()); Path dataPath = Paths.get(dataSamplesFolder + "/lunatic_xml/fake-lunatic-data-1.xml"); - LunaticXmlDataParser parser = new LunaticXmlDataParser(data); + LunaticXmlDataParser parser = new LunaticXmlDataParser(data, fileUtilsInterface); parser.parseSurveyData(dataPath,null); // @@ -130,7 +133,7 @@ void parseLunaticXml_noCollected() throws NullException { SurveyRawData data = new SurveyRawData("TEST"); data.setMetadataModel(MetadataModelTest.createVariablesMap_oneLevel()); Path dataPath = Paths.get(dataSamplesFolder + "/lunatic_xml/fake-lunatic-data-3.xml"); - LunaticXmlDataParser parser = new LunaticXmlDataParser(data); + LunaticXmlDataParser parser = new LunaticXmlDataParser(data, fileUtilsInterface); //When parser.parseSurveyData(dataPath,null); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/PaperDataParserTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/PaperDataParserTest.java index 798f6dfe..5cfd4adc 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/PaperDataParserTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/parsers/PaperDataParserTest.java @@ -7,6 +7,8 @@ import fr.insee.kraftwerk.core.metadata.VariableType; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.assertj.core.api.Assertions; import org.junit.jupiter.api.Test; @@ -18,12 +20,13 @@ class PaperDataParserTest { private final String dataSamplesFolder = TestConstants.UNIT_TESTS_DIRECTORY + "/data"; + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); @Test void readPaperFile_null() { //Given SurveyRawData data = new SurveyRawData("TEST"); - PaperDataParser parser = new PaperDataParser(data); + PaperDataParser parser = new PaperDataParser(data, fileUtilsInterface); //When + Then assertThrows(NullPointerException.class,() ->parser.parseDataFile(null)); @@ -39,7 +42,7 @@ void parsePaperDataFile() throws NullException, NumberFormatException { metadataModel.getVariables().putVariable(new Variable("TESTINT1", metadataModel.getRootGroup(), VariableType.INTEGER)); data.setMetadataModel(metadataModel); Path dataPath = Paths.get(dataSamplesFolder + "/paper_csv/fake-paper-data.csv"); - PaperDataParser parser = new PaperDataParser(data); + PaperDataParser parser = new PaperDataParser(data, fileUtilsInterface); //When parser.parseSurveyData(dataPath,null); @@ -72,7 +75,7 @@ void parsePaperDataFolder() throws NullException, NumberFormatException { metadataModel.getVariables().putVariable(new Variable("TESTINT1", metadataModel.getRootGroup(), VariableType.INTEGER)); data.setMetadataModel(metadataModel); Path dataPath = Paths.get(dataSamplesFolder + "/paper_csv/fake-multiple-files"); - PaperDataParser parser = new PaperDataParser(data); + PaperDataParser parser = new PaperDataParser(data, fileUtilsInterface); //When parser.parseSurveyData(dataPath,null); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java index 43e9abf2..d17b2a03 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java @@ -36,7 +36,7 @@ void buildVtlBindings_errorWithoutMetadata() throws KraftwerkException { VtlBindings vtlBindings = new VtlBindings(); boolean withAllReportingData = false; boolean withDdi = true; - BuildBindingsSequence bbs = new BuildBindingsSequence(withAllReportingData); + BuildBindingsSequence bbs = new BuildBindingsSequence(withAllReportingData, new FileSystemImpl()); //WHEN MetadataModel metadata = null; @@ -54,7 +54,7 @@ void buildVtlBindings_success_changingDdi_and_reportingData(boolean withDdi, boo inputSamplesDirectory, fileUtilsInterface); String dataMode = "CAPI"; VtlBindings vtlBindings = new VtlBindings(); - BuildBindingsSequence bbs = new BuildBindingsSequence(withAllReportingData); + BuildBindingsSequence bbs = new BuildBindingsSequence(withAllReportingData, new FileSystemImpl()); MetadataModel capiMetadata = new MetadataModel(); capiMetadata.getVariables().putVariable(new Variable("VAR1", capiMetadata.getRootGroup(), VariableType.STRING)); capiMetadata.getVariables().putVariable(new UcqVariable("PAYSNAIS", capiMetadata.getRootGroup(), VariableType.STRING)); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java index c2947789..700437e3 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java @@ -3,6 +3,8 @@ import java.net.MalformedURLException; import java.nio.file.Path; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import org.xmlunit.assertj3.XmlAssert; @@ -11,8 +13,10 @@ class SaxonTransformerTest { + FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + @Test - void applyXsltScript() throws MalformedURLException { + void applyXsltScript(){ String xsltTestScript = TestConstants.UNIT_TESTS_DIRECTORY + "/utils/xsl/do-nothing.xsl"; String inXmlFile = TestConstants.UNIT_TESTS_DIRECTORY + "/utils/xsl/note.xml"; String outXmlFile = TestConstants.UNIT_TESTS_DUMP + "/xsl-output.xml"; @@ -20,8 +24,8 @@ void applyXsltScript() throws MalformedURLException { SaxonTransformer saxonTransformer = new SaxonTransformer(); saxonTransformer.xslTransform(Path.of(inXmlFile), xsltTestScript,Path.of(outXmlFile)); // - String inContent = TextFileReader.readFromPath(Path.of(inXmlFile)); - String outContent = TextFileReader.readFromPath(Path.of(outXmlFile)); + String inContent = TextFileReader.readFromPath(Path.of(inXmlFile), fileUtilsInterface); + String outContent = TextFileReader.readFromPath(Path.of(outXmlFile), fileUtilsInterface); // XmlAssert.assertThat(inContent).and(outContent).areSimilar(); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlBindingsTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlBindingsTest.java index 963b58f7..93cf2fb8 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlBindingsTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlBindingsTest.java @@ -5,6 +5,8 @@ import fr.insee.kraftwerk.core.metadata.MetadataModel; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.vtl.model.Dataset; import fr.insee.vtl.model.Dataset.Role; import fr.insee.vtl.model.InMemoryDataset; @@ -25,8 +27,8 @@ class VtlBindingsTest { private VtlBindings vtlBindings; private List errors; - - VtlExecute vtlExecute = new VtlExecute(); + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + VtlExecute vtlExecute = new VtlExecute(fileUtilsInterface); Dataset ds1 = new InMemoryDataset( List.of( diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlJsonDatasetWriterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlJsonDatasetWriterTest.java index c4d92e53..12fee50a 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlJsonDatasetWriterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/vtl/VtlJsonDatasetWriterTest.java @@ -5,6 +5,8 @@ import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; import fr.insee.kraftwerk.core.rawdata.SurveyRawDataTest; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.vtl.model.Dataset; import org.apache.commons.lang3.tuple.Pair; import org.junit.jupiter.api.BeforeEach; @@ -19,8 +21,9 @@ class VtlJsonDatasetWriterTest { private VtlBindings vtlBindings; - - VtlExecute vtlExecute = new VtlExecute(); + + private final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); + VtlExecute vtlExecute = new VtlExecute(fileUtilsInterface); @BeforeEach public void initVtlBindings() { diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java index 77819d51..28159230 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java @@ -13,6 +13,7 @@ import fr.insee.kraftwerk.core.parsers.DataParser; import fr.insee.kraftwerk.core.parsers.LunaticXmlDataParser; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; import fr.insee.vtl.model.Dataset; @@ -43,7 +44,7 @@ public class CalculatedProcessingDefinition { private Dataset outDataset; private List variableNamesList; - VtlExecute vtlExecute = new VtlExecute(); + VtlExecute vtlExecute = new VtlExecute(new FileSystemImpl()); List errors = new ArrayList<>(); @ParameterType("(?:[^,]*)(?:,\\s?[^,]*)*") @@ -64,11 +65,11 @@ public void getCampaignFiles(String campaignName, String dataMode) throws Malfor this.dataMode = dataMode; // metadataModel = DDIReader.getMetadataFromDDI( - Constants.convertToUrl(campaignPacks.get(campaignName).get(dataMode).get("ddi"))); + Constants.convertToUrl(campaignPacks.get(campaignName).get(dataMode).get("ddi")), new FileSystemImpl()); // SurveyRawData data = new SurveyRawData(); data.setMetadataModel(metadataModel); - DataParser parser = new LunaticXmlDataParser(data); + DataParser parser = new LunaticXmlDataParser(data, new FileSystemImpl()); parser.parseSurveyData(Paths.get(campaignPacks.get(campaignName).get(dataMode).get("data")),null); // vtlBindings = new VtlBindings(); @@ -80,7 +81,7 @@ public void readCampaignData() { // CalculatedVariables calculatedVariables = LunaticReader.getCalculatedFromLunatic( Path.of(campaignPacks.get(campaignName).get(dataMode).get("lunatic"))); - DataProcessing calculatedProcessing = new CalculatedProcessing(vtlBindings,calculatedVariables); + DataProcessing calculatedProcessing = new CalculatedProcessing(vtlBindings,calculatedVariables, new FileSystemImpl()); calculatedProcessing.applyVtlTransformations("TEST", null,errors); // outDataset = vtlBindings.getDataset("TEST"); diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java index 0ca3d85c..16224751 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.utils.TextFileReader; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.xsl.SaxonTransformer; import io.cucumber.java.en.Given; import io.cucumber.java.en.Then; @@ -45,7 +46,7 @@ public void compare_ddi(String nameDDI) throws IOException, URISyntaxException { SaxonTransformer transformer = new SaxonTransformer(); transformer.xslTransform(url, Constants.XSLT_STRUCTURED_VARIABLES, tempPath); - actualString = TextFileReader.readFromPath(tempPath); + actualString = TextFileReader.readFromPath(tempPath, new FileSystemImpl()); if (actualString.trim().contains("")) { actualAnswer = "DDI collected"; diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java index f2be95d1..c2f0ec78 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java @@ -86,7 +86,7 @@ public void launch_all_steps(String campaignDirectoryName) { this.campaignName = campaignDirectoryName; inDirectory = inDirectory.resolve(campaignName); outDirectory = outDirectory.resolve(campaignName); - controlInputSequence = new ControlInputSequence(inDirectory.toString()); + controlInputSequence = new ControlInputSequence(inDirectory.toString(), new FileSystemImpl()); // We clean the output and the temp directory deleteDirectory(outDirectory.toFile()); deleteDirectory(tempDirectory.toFile()); @@ -169,8 +169,8 @@ public void launch_main_filebyfile() throws KraftwerkException { @When("Step 2 : We get each unimodal dataset") public void unimodal_treatments() throws KraftwerkException, SQLException, NullException { try (Statement statement = database.createStatement()) { - metadataModelMap = MetadataUtils.getMetadata(userInputs.getModeInputsMap()); - BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(true); + metadataModelMap = MetadataUtils.getMetadata(userInputs.getModeInputsMap(), new FileSystemImpl()); + BuildBindingsSequence buildBindingsSequence = new BuildBindingsSequence(true, new FileSystemImpl()); for (String dataMode : userInputs.getModeInputsMap().keySet()) { boolean withDDI = true; buildBindingsSequence.buildVtlBindings(userInputs, dataMode, vtlBindings, metadataModelMap.get(dataMode), withDDI, null); @@ -193,9 +193,9 @@ public void export_results() throws KraftwerkException, SQLException { try (Statement statement = database.createStatement()) { WriterSequence writerSequence = new WriterSequence(); LocalDateTime localDateTime = LocalDateTime.now(); - writerSequence.writeOutputFiles(inDirectory, localDateTime, vtlBindings, userInputs.getModeInputsMap(), metadataModelMap, errors, statement); + writerSequence.writeOutputFiles(inDirectory, localDateTime, vtlBindings, userInputs.getModeInputsMap(), metadataModelMap, errors, statement, new FileSystemImpl()); writeErrorsFile(inDirectory, localDateTime, errors); - outputFiles = new CsvOutputFiles(outDirectory, vtlBindings, userInputs.getModes(), statement); + outputFiles = new CsvOutputFiles(outDirectory, vtlBindings, userInputs.getModes(), statement, new FileSystemImpl()); } } diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java index eacedeee..664ec562 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/ParadataDefinitions.java @@ -41,7 +41,7 @@ public class ParadataDefinitions { public void launch_all_steps(String campaignName) throws KraftwerkException { Path campaignDirectory = Paths.get(FUNCTIONAL_TESTS_INPUT_DIRECTORY).resolve(campaignName); - controlInputSequence = new ControlInputSequence(campaignDirectory.toString()); + controlInputSequence = new ControlInputSequence(campaignDirectory.toString(), new FileSystemImpl()); UserInputsFile userInputs = controlInputSequence.getUserInputs(campaignDirectory, fileUtilsInterface); // For now, only one file String modeName = userInputs.getModes().getFirst(); @@ -49,8 +49,8 @@ public void launch_all_steps(String campaignName) throws KraftwerkException { // parse data data = new SurveyRawData(); data.setDataMode(modeInputs.getDataMode()); - data.setMetadataModel(DDIReader.getMetadataFromDDI(modeInputs.getDdiUrl())); - DataParser parser = DataParserManager.getParser(modeInputs.getDataFormat(), data); + data.setMetadataModel(DDIReader.getMetadataFromDDI(modeInputs.getDdiUrl(), fileUtilsInterface)); + DataParser parser = DataParserManager.getParser(modeInputs.getDataFormat(), data, fileUtilsInterface); parser.parseSurveyData(modeInputs.getDataFile(),null); // get paradata folder paradataFolder = modeInputs.getParadataFolder(); @@ -60,7 +60,7 @@ public void launch_all_steps(String campaignName) throws KraftwerkException { public void collect_paradata_test() throws NullException { if (modeInputs.getParadataFolder() != null && !modeInputs.getParadataFolder().toString().contentEquals("")) { - ParadataParser paraDataParser = new ParadataParser(); + ParadataParser paraDataParser = new ParadataParser(fileUtilsInterface); paradata = new Paradata(paradataFolder); paraDataParser.parseParadata(paradata, data); paradata.getListParadataUE().get(0).getEvents().stream().forEach(e -> log.debug(e.getTimestamp() + ","+ e.getIdParadataObject())); diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java index 4d6adef4..6a469758 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java @@ -3,6 +3,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.metadata.DDIReader; import fr.insee.kraftwerk.core.metadata.MetadataModel; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import io.cucumber.java.en.Given; import io.cucumber.java.en.Then; import io.cucumber.java.en.When; @@ -31,7 +32,7 @@ public void set_linkDDI(String linkDDI) throws MalformedURLException, URISyntaxE @When("I try to collect the variables's infos") public void collect_variables() throws KraftwerkException { - metadataModel = DDIReader.getMetadataFromDDI(linkDDI); + metadataModel = DDIReader.getMetadataFromDDI(linkDDI, new FileSystemImpl()); } @Then("The variables I try to count should answer {int} and have {string} in it") From 7ea617d9f81af737674e6b273b8ce9085daec2a6 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 24 Jun 2024 08:25:25 +0200 Subject: [PATCH 19/46] Removed more file system calls + unused imports + moved XML utils to xml package --- .../fr/insee/kraftwerk/api/services/SplitterService.java | 4 ++-- .../extradata/reportingdata/XMLReportingDataParser.java | 2 +- .../fr/insee/kraftwerk/core/inputs/UserInputsFile.java | 7 +++---- .../kraftwerk/core/parsers/LunaticXmlDataParser.java | 2 +- .../insee/kraftwerk/core/parsers/XformsDataParser.java | 2 +- .../core/sequence/BuildBindingsSequenceGenesis.java | 7 ++----- .../insee/kraftwerk/core/utils/files/FileSystemImpl.java | 3 --- .../fr/insee/kraftwerk/core/utils/files/MinioImpl.java | 9 +++------ .../kraftwerk/core/utils/{ => xml}/XmlFileReader.java | 2 +- .../utils/{XMLSplitter.java => xml/XmlSplitter.java} | 6 +++--- .../utils/{XMLSplitterTest.java => XmlSplitterTest.java} | 5 +++-- 11 files changed, 20 insertions(+), 29 deletions(-) rename kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/{ => xml}/XmlFileReader.java (97%) rename kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/{XMLSplitter.java => xml/XmlSplitter.java} (98%) rename kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/{XMLSplitterTest.java => XmlSplitterTest.java} (94%) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java index d0055789..b841b1f5 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java @@ -1,7 +1,7 @@ package fr.insee.kraftwerk.api.services; import fr.insee.kraftwerk.api.configuration.MinioConfig; -import fr.insee.kraftwerk.core.utils.XMLSplitter; +import fr.insee.kraftwerk.core.utils.xml.XmlSplitter; import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.tags.Tag; import lombok.extern.log4j.Log4j2; @@ -31,7 +31,7 @@ public ResponseEntity saveResponsesFromXmlFile(@RequestParam("inputFolde @RequestParam("nbResponsesByFile") int nbSU) throws Exception { log.info("Split XML file : " + filename + " into " + nbSU + " SU by file"); - XMLSplitter.split(String.format("%s/in/%s/",defaultDirectory,inputFolder), filename, String.format("%s/in/%s/",defaultDirectory,outputFolder), "SurveyUnit", nbSU); + XmlSplitter.split(String.format("%s/in/%s/",defaultDirectory,inputFolder), filename, String.format("%s/in/%s/",defaultDirectory,outputFolder), "SurveyUnit", nbSU); return new ResponseEntity<>("File split", HttpStatus.OK); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java index 9051268f..2d037dd4 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/extradata/reportingdata/XMLReportingDataParser.java @@ -3,7 +3,7 @@ import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.exceptions.NullException; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; -import fr.insee.kraftwerk.core.utils.XmlFileReader; +import fr.insee.kraftwerk.core.utils.xml.XmlFileReader; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import nu.xom.Document; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java index d941c332..7b4239de 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java @@ -10,7 +10,6 @@ import lombok.Setter; import lombok.extern.log4j.Log4j2; -import java.io.File; import java.io.IOException; import java.net.URL; import java.nio.file.Path; @@ -46,12 +45,12 @@ private void readUserInputs() throws UnknownDataFormatException, MissingMandator String dataFolder = readField(fileNode, "data_file"); String paradataFolder = readField(fileNode, "paradata_folder"); String reportingFolder = readField(fileNode, "reporting_data_file"); - Path dataPath = (new File(dataFolder).exists()) ? convertToUserPath(dataFolder) : fileUtilsInterface.convertToPath(dataFolder,inputDirectory); + Path dataPath = (fileUtilsInterface.isFileExists(dataFolder)) ? convertToUserPath(dataFolder) : fileUtilsInterface.convertToPath(dataFolder,inputDirectory); URL ddiFile = fileUtilsInterface.convertToUrl(readField(fileNode, "DDI_file"),inputDirectory); Path lunaticFile = fileUtilsInterface.convertToPath(readField(fileNode, "lunatic_file"),inputDirectory); String dataFormat = readField(fileNode, "data_format"); - Path paradataPath = (paradataFolder != null && new File(paradataFolder).exists()) ? convertToUserPath(paradataFolder) : fileUtilsInterface.convertToPath(paradataFolder,inputDirectory); - Path reportingDataFile = (reportingFolder != null && new File(reportingFolder).exists()) ? convertToUserPath(reportingFolder) : fileUtilsInterface.convertToPath(reportingFolder,inputDirectory); + Path paradataPath = (paradataFolder != null && fileUtilsInterface.isFileExists(paradataFolder)) ? convertToUserPath(paradataFolder) : fileUtilsInterface.convertToPath(paradataFolder,inputDirectory); + Path reportingDataFile = (reportingFolder != null && fileUtilsInterface.isFileExists(reportingFolder)) ? convertToUserPath(reportingFolder) : fileUtilsInterface.convertToPath(reportingFolder,inputDirectory); Path vtlFile = fileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); ModeInputs modeInputs = new ModeInputs(); modeInputs.setDataFile(dataPath); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java index 17d83365..b325748e 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java @@ -6,7 +6,7 @@ import fr.insee.kraftwerk.core.rawdata.GroupInstance; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; -import fr.insee.kraftwerk.core.utils.XmlFileReader; +import fr.insee.kraftwerk.core.utils.xml.XmlFileReader; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import nu.xom.Document; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java index 89f8df35..f1f74ad2 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/XformsDataParser.java @@ -4,7 +4,7 @@ import fr.insee.kraftwerk.core.rawdata.GroupInstance; import fr.insee.kraftwerk.core.rawdata.QuestionnaireData; import fr.insee.kraftwerk.core.rawdata.SurveyRawData; -import fr.insee.kraftwerk.core.utils.XmlFileReader; +import fr.insee.kraftwerk.core.utils.xml.XmlFileReader; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import nu.xom.Document; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java index c931078a..f75e127e 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java @@ -20,7 +20,6 @@ import fr.insee.kraftwerk.core.vtl.VtlBindings; import fr.insee.kraftwerk.core.vtl.VtlExecute; -import java.io.File; import java.nio.file.Path; import java.sql.Statement; import java.util.List; @@ -85,8 +84,7 @@ public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map listFiles = fileUtilsInterface.listFiles(reportingDataFile.toString()); for (String file : listFiles) { ReportingData reportingData = new ReportingData(reportingDataFile.resolve(file)); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index b4dadd40..1f382f9b 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -11,11 +11,8 @@ import javax.annotation.Nullable; import java.io.File; -import java.io.FileNotFoundException; -import java.io.FileOutputStream; import java.io.IOException; import java.io.InputStream; -import java.io.OutputStream; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index 268708ec..a97b6244 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -21,9 +21,7 @@ import lombok.extern.slf4j.Slf4j; import java.io.ByteArrayInputStream; -import java.io.File; import java.io.InputStream; -import java.io.OutputStream; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; @@ -32,7 +30,6 @@ import java.util.ArrayList; import java.util.Arrays; import java.util.List; -import java.util.regex.Pattern; @Slf4j @AllArgsConstructor @@ -62,7 +59,7 @@ public void renameInputFile(Path inDirectory) { public void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException { // Path inputFolder = userInputsFile.getInputDirectory(); - String[] directories = inputFolder.toString().split(Pattern.quote(File.separator)); + String[] directories = inputFolder.toString().split("/"); String campaignName = directories[directories.length - 1]; // @@ -290,14 +287,14 @@ private void archiveReportingData(Path inputFolder, String campaignName, ModeInp } private String getRoot(Path path, String campaignName) { - String[] directories = path.toString().split(Pattern.quote(File.separator)); + String[] directories = path.toString().split("/"); int campaignIndex = Arrays.asList(directories).indexOf(campaignName); String[] newDirectories = Arrays.copyOfRange(directories, campaignIndex + 1, directories.length); StringBuilder result = new StringBuilder(); String sep = ""; for (String directory : newDirectories) { result.append(sep).append(directory); - sep = File.separator; + sep = "/"; } return result.toString(); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XmlFileReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlFileReader.java similarity index 97% rename from kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XmlFileReader.java rename to kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlFileReader.java index 85e9d35f..52eebf8f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XmlFileReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlFileReader.java @@ -1,4 +1,4 @@ -package fr.insee.kraftwerk.core.utils; +package fr.insee.kraftwerk.core.utils.xml; import java.io.IOException; import java.io.InputStream; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlSplitter.java similarity index 98% rename from kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java rename to kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlSplitter.java index f5507761..623263a7 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/XMLSplitter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlSplitter.java @@ -1,4 +1,4 @@ -package fr.insee.kraftwerk.core.utils; +package fr.insee.kraftwerk.core.utils.xml; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; @@ -15,11 +15,11 @@ import java.util.ArrayList; import java.util.List; -public class XMLSplitter { +public class XmlSplitter { //TODO Make it work with MinIO // We use StAX in this class to deal with memory issues on huge XML files - private XMLSplitter() { + private XmlSplitter() { throw new IllegalStateException("Utility class"); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java similarity index 94% rename from kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java rename to kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java index ea3835a6..bc530286 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XMLSplitterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java @@ -3,6 +3,7 @@ import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.xml.XmlSplitter; import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.DisplayName; import org.junit.jupiter.api.Test; @@ -22,7 +23,7 @@ import static org.junit.Assert.assertEquals; -class XMLSplitterTest { +class XmlSplitterTest { static final String outDirectory = TestConstants.UNIT_TESTS_DUMP+"/split/"; @@ -41,7 +42,7 @@ static void cleanUpBeforeTests() throws Exception { } } } - XMLSplitter.split(TestConstants.UNIT_TESTS_DIRECTORY+"/data/lunatic_xml/", "fake-lunatic-data-1.xml", + XmlSplitter.split(TestConstants.UNIT_TESTS_DIRECTORY+"/data/lunatic_xml/", "fake-lunatic-data-1.xml", outDirectory,"SurveyUnit",2); } From dd3d86973a8f94c1df3773b135eaf9f3efb298f5 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 24 Jun 2024 09:51:33 +0200 Subject: [PATCH 20/46] Adapted Xml Splitter and CSV/Parquet output to be able to use minio --- .../api/services/SplitterService.java | 19 ++- .../core/dataprocessing/DataProcessing.java | 1 - .../core/outputs/csv/CsvOutputFiles.java | 19 +-- .../outputs/parquet/ParquetOutputFiles.java | 12 +- .../core/utils/files/FileSystemImpl.java | 30 ++-- .../core/utils/files/FileSystemType.java | 6 + .../core/utils/files/FileUtilsInterface.java | 16 +++ .../kraftwerk/core/utils/files/MinioImpl.java | 45 ++++-- .../kraftwerk/core/utils/xml/XmlSplitter.java | 133 +++++++++--------- .../kraftwerk/core/utils/XmlSplitterTest.java | 3 +- 10 files changed, 182 insertions(+), 102 deletions(-) create mode 100644 kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemType.java diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java index b841b1f5..c8fdbca8 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java @@ -1,7 +1,12 @@ package fr.insee.kraftwerk.api.services; import fr.insee.kraftwerk.api.configuration.MinioConfig; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileSystemType; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; +import fr.insee.kraftwerk.core.utils.files.MinioImpl; import fr.insee.kraftwerk.core.utils.xml.XmlSplitter; +import io.minio.MinioClient; import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.tags.Tag; import lombok.extern.log4j.Log4j2; @@ -16,7 +21,6 @@ @Tag(name = "${tag.splitter}") @Log4j2 public class SplitterService extends KraftwerkService{ -//TODO add MinIO support @Autowired public SplitterService(MinioConfig minioConfig) { @@ -28,10 +32,17 @@ public SplitterService(MinioConfig minioConfig) { public ResponseEntity saveResponsesFromXmlFile(@RequestParam("inputFolder") String inputFolder, @RequestParam("outputFolder") String outputFolder, @RequestParam("filename") String filename, - @RequestParam("nbResponsesByFile") int nbSU) + @RequestParam("nbResponsesByFile") int nbSU, + @RequestParam("fileSystemType") FileSystemType fileSystemType) throws Exception { - log.info("Split XML file : " + filename + " into " + nbSU + " SU by file"); - XmlSplitter.split(String.format("%s/in/%s/",defaultDirectory,inputFolder), filename, String.format("%s/in/%s/",defaultDirectory,outputFolder), "SurveyUnit", nbSU); + log.info("Split XML file : " + filename + " into " + nbSU + " SU by file using " + + (fileSystemType.equals(FileSystemType.MINIO) ? "Minio" : "OS file system")); + + FileUtilsInterface fileUtilsInterface = fileSystemType.equals(FileSystemType.MINIO) ? + new MinioImpl(MinioClient.builder().credentials(minioConfig.getAccessKey(),minioConfig.getSecretKey()).endpoint(minioConfig.getEndpoint()).build(), minioConfig.getBucketName()) : + new FileSystemImpl(); + + XmlSplitter.split(String.format("%s/in/%s/",defaultDirectory,inputFolder), filename, String.format("%s/in/%s/",defaultDirectory,outputFolder), "SurveyUnit", nbSU, fileUtilsInterface); return new ResponseEntity<>("File split", HttpStatus.OK); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java index f5a60433..27f58748 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/dataprocessing/DataProcessing.java @@ -69,7 +69,6 @@ protected String applyAutomatedVtlInstructions(String bindingName, List errors){ - //TODO change to interface String vtlScript = TextFileReader.readFromPath(userVtlInstructionsPath, fileUtilsInterface); log.info(String.format("User VTL instructions read for step %s:%n%s", getStepName(), vtlScript)); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java index 43837c12..ded7586e 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java @@ -56,8 +56,10 @@ public CsvOutputFiles(Path outDirectory, VtlBindings vtlBindings, KraftwerkExecu @Override public void writeOutputTables(Map metadataModels) throws KraftwerkException { for (String datasetName : getDatasetToCreate()) { - File outputFile = getOutputFolder().resolve(outputFileName(datasetName)).toFile(); try { + //Temporary file + File tmpOutputFile = File.createTempFile(outputFileName(datasetName), null); + //Get column names List columnNames = SqlUtils.getColumnNames(getDatabase(), datasetName); @@ -72,10 +74,10 @@ public void writeOutputTables(Map metadataModels) throws List boolColumnIndexes = new ArrayList<>(); //Create file with double quotes header - Files.write(outputFile.toPath(), buildHeader(columnNames, boolColumnNames, boolColumnIndexes).getBytes()); + Files.write(tmpOutputFile.toPath(), buildHeader(columnNames, boolColumnNames, boolColumnIndexes).getBytes()); //Data export into temp file - StringBuilder exportCsvQuery = new StringBuilder(String.format("COPY %s TO '%s' (FORMAT CSV, HEADER false, DELIMITER '%s', OVERWRITE_OR_IGNORE true", datasetName, outputFile.getAbsolutePath() +"data", Constants.CSV_OUTPUTS_SEPARATOR)); + StringBuilder exportCsvQuery = new StringBuilder(String.format("COPY %s TO '%s' (FORMAT CSV, HEADER false, DELIMITER '%s', OVERWRITE_OR_IGNORE true", datasetName, tmpOutputFile.getAbsolutePath() +"data", Constants.CSV_OUTPUTS_SEPARATOR)); //Double quote values parameter exportCsvQuery.append(", FORCE_QUOTE("); for (String stringColumnName : columnNames) { @@ -90,18 +92,21 @@ public void writeOutputTables(Map metadataModels) throws //Merge data file with header file //Read line by line to avoid memory waste - try(BufferedReader bufferedReader = Files.newBufferedReader(Path.of(outputFile.toPath().toAbsolutePath() + "data"))){ + try(BufferedReader bufferedReader = Files.newBufferedReader(Path.of(tmpOutputFile.toPath().toAbsolutePath() + "data"))){ String line = bufferedReader.readLine(); while(line != null){ //Apply transformations to elements line = applyNullTransformation(line); line = applyBooleanTransformations(line, boolColumnIndexes); - Files.write(outputFile.toPath(),(line + "\n").getBytes(),StandardOpenOption.APPEND); + Files.write(tmpOutputFile.toPath(),(line + "\n").getBytes(),StandardOpenOption.APPEND); line = bufferedReader.readLine(); } } - Files.deleteIfExists(Path.of(outputFile.toPath().toAbsolutePath() + "data")); + Files.deleteIfExists(Path.of(tmpOutputFile.toPath().toAbsolutePath() + "data")); + + //Move to output folder + getFileUtilsInterface().moveFile(tmpOutputFile.toPath().toAbsolutePath(), getOutputFolder().resolve(outputFileName(datasetName)).toString()); //Count rows for functional log if (kraftwerkExecutionLog != null) { @@ -110,8 +115,6 @@ public void writeOutputTables(Map metadataModels) throws kraftwerkExecutionLog.getLineCountByTableMap().put(datasetName, countResult.getInt(1)); } } - - //TODO export to minio } catch (SQLException | IOException e) { throw new KraftwerkException(500, e.toString()); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java index feb36062..275fd2f2 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java @@ -52,12 +52,16 @@ public ParquetOutputFiles(Path outDirectory, VtlBindings vtlBindings, List metadataModels) throws KraftwerkException { for (String datasetName : getDatasetToCreate()) { - File outputFile = getOutputFolder().resolve(outputFileName(datasetName)).toFile(); try { - Files.deleteIfExists(outputFile.toPath()); + File tmpOutputFile = File.createTempFile(outputFileName(datasetName), null); + + Files.deleteIfExists(tmpOutputFile.toPath()); //Data export - getDatabase().execute(String.format("COPY %s TO '%s' (FORMAT PARQUET)", datasetName, outputFile.getAbsolutePath())); - //TODO export to minio + getDatabase().execute(String.format("COPY %s TO '%s' (FORMAT PARQUET)", datasetName, tmpOutputFile.getAbsolutePath())); + + + //Move to output folder + getFileUtilsInterface().moveFile(tmpOutputFile.toPath().toAbsolutePath(), getOutputFolder().resolve(outputFileName(datasetName)).toString()); } catch (Exception e) { throw new KraftwerkException(500, e.toString()); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 1f382f9b..7144a60a 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -19,6 +19,7 @@ import java.net.URL; import java.nio.file.Files; import java.nio.file.Path; +import java.nio.file.StandardCopyOption; import java.nio.file.StandardOpenOption; import java.util.Arrays; import java.util.List; @@ -89,6 +90,8 @@ public void deleteDirectory(Path directoryPath) throws KraftwerkException { */ @Override public List listFiles(String dir) { + File dirFile = new File(dir); + return Stream.of(new File(dir).listFiles()) .filter(file -> !file.isDirectory()) .map(File::getName) @@ -169,6 +172,7 @@ public long getSizeOf(String path) { @Override public void writeFile(String path, String toWrite, boolean replace) { + createDirectoryIfNotExist(Path.of(path)); StandardOpenOption standardOpenOption = replace || !isFileExists(path) ? StandardOpenOption.CREATE : StandardOpenOption.APPEND; try { Files.write(Path.of(path), toWrite.getBytes(), standardOpenOption); @@ -221,6 +225,22 @@ private void archiveReportingData(Path inputFolder, String campaignName, ModeInp } } + @Override + public void moveFile(String srcPath, String dstPath) throws KraftwerkException { + try { + createDirectoryIfNotExist(Path.of(dstPath).getParent()); + Files.move(Path.of(srcPath), Path.of(dstPath), StandardCopyOption.REPLACE_EXISTING); + } catch (IOException e) { + throw new KraftwerkException(500, "Can't move file " + srcPath + " to " + dstPath); + } + } + + @Override + public void moveFile(Path fileSystemPath, String dstPath) throws KraftwerkException { + //Same than other moveFile + moveFile(fileSystemPath.toString(), dstPath); + } + /** * If paradata, we move the paradata folder * @param inputFolder @@ -245,7 +265,7 @@ private void archiveData(Path inputFolder, String campaignName, ModeInputs modeI new File(newDataPath.getParent().toString()).mkdirs(); } if (Files.isRegularFile(dataPath)) { - moveFile(dataPath, newDataPath); + moveFile(dataPath.toString(), newDataPath.toString()); } else if (Files.isDirectory(dataPath)) { moveDirectory(dataPath.toFile(),newDataPath.toFile()); } else { @@ -259,14 +279,6 @@ private void createArchiveDirectoryIfNotExists(Path inputFolder) { } } - private void moveFile(Path dataPath, Path newDataPath) throws KraftwerkException { - try { - Files.move(dataPath, newDataPath); - } catch (IOException e) { - throw new KraftwerkException(500, "Can't move file " + dataPath + " to " + newDataPath); - } - } - private void moveDirectory(File sourceFile, File destFile) throws KraftwerkException { if (sourceFile.isDirectory()) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemType.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemType.java new file mode 100644 index 00000000..aa29915b --- /dev/null +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemType.java @@ -0,0 +1,6 @@ +package fr.insee.kraftwerk.core.utils.files; + +public enum FileSystemType { + OS_FILESYSTEM, + MINIO +} diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index a8291a8d..b1663db6 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -89,4 +89,20 @@ private static Path transformToOther(Path inDirectory, String other) { InputStream readFile(String path); boolean isFileExists(String path); + + /** + * Move file from source to destination (depends of the file system) + * @param srcPath source path + * @param dstPath destination path + * @throws KraftwerkException + */ + void moveFile(String srcPath, String dstPath) throws KraftwerkException; + + /** + * Move file from local file system to another path + * @param fileSystemPath local path + * @param dstPath destination path + * @throws KraftwerkException + */ + void moveFile(Path fileSystemPath, String dstPath) throws KraftwerkException; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index a97b6244..11c21032 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -21,11 +21,13 @@ import lombok.extern.slf4j.Slf4j; import java.io.ByteArrayInputStream; +import java.io.FileInputStream; import java.io.InputStream; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; import java.net.URL; +import java.nio.file.Files; import java.nio.file.Path; import java.util.ArrayList; import java.util.Arrays; @@ -52,7 +54,11 @@ public void renameInputFile(Path inDirectory) { log.warn("Timestamped input file will be over-written."); deleteFile(file2MinioPathString); } - moveFile(file1MinioPathString, file2MinioPathString); + try { + moveFile(file1MinioPathString, file2MinioPathString); + }catch (Exception e){ + log.error(e.toString()); + } } @Override @@ -200,9 +206,33 @@ public boolean isFileExists(String objectPath) { } } + @Override + public void moveFile(String srcMinioPath, String dstMinioPath) throws KraftwerkException { + try { + copyFile(srcMinioPath, dstMinioPath); + deleteFile(srcMinioPath); + } catch (Exception e) { + throw new KraftwerkException(500, "Can't move file " + srcMinioPath + " to " + dstMinioPath); + } + } + + @Override + public void moveFile(Path fileSystemPath, String dstMinioPath) throws KraftwerkException { + try (InputStream inputStream = new FileInputStream(fileSystemPath.toFile())){ + writeFileOnMinio(dstMinioPath, inputStream, Files.size(fileSystemPath)); + } catch (Exception e) { + throw new KraftwerkException(500, "Can't move file " + fileSystemPath + " to " + dstMinioPath); + } + try { + Files.deleteIfExists(fileSystemPath); + }catch (Exception e) { + log.error("Error during file system file deletion : " + e); + } + } + //Utilities - private void writeFileOnMinio(String minioPath, InputStream inputStream, int fileSize) { + private void writeFileOnMinio(String minioPath, InputStream inputStream, long fileSize) { try { minioClient.putObject(PutObjectArgs.builder().bucket(bucketName).stream(inputStream, fileSize, -1).object(minioPath).build()); } catch (Exception e) { @@ -219,15 +249,6 @@ private void copyFile(String srcMinioPath, String dstMinioPath) { } } - private void moveFile(String srcMinioPath, String dstMinioPath) { - try { - copyFile(srcMinioPath, dstMinioPath); - deleteFile(srcMinioPath); - } catch (Exception e) { - log.error(e.toString()); - } - } - private void moveDirectory(String srcMinioPath, String dstMinioPath) { try { for (String filePath : listFiles(srcMinioPath)) { @@ -255,7 +276,7 @@ private void deleteFile(String minioPath) { - private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) { + private void archiveData(Path inputFolder, String campaignName, ModeInputs modeInputs) throws KraftwerkException{ Path dataPath = modeInputs.getDataFile(); Path newDataPath = inputFolder.resolve(ARCHIVE).resolve(getRoot(dataPath, campaignName)); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlSplitter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlSplitter.java index 623263a7..1870e04b 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlSplitter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xml/XmlSplitter.java @@ -1,73 +1,78 @@ package fr.insee.kraftwerk.core.utils.xml; -import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import javax.xml.stream.*; import javax.xml.stream.events.EndDocument; import javax.xml.stream.events.StartDocument; import javax.xml.stream.events.StartElement; import javax.xml.stream.events.XMLEvent; -import java.io.FileNotFoundException; -import java.io.FileReader; +import java.io.File; import java.io.FileWriter; import java.io.IOException; -import java.nio.file.Paths; +import java.io.InputStream; import java.util.ArrayList; import java.util.List; public class XmlSplitter { - //TODO Make it work with MinIO // We use StAX in this class to deal with memory issues on huge XML files private XmlSplitter() { throw new IllegalStateException("Utility class"); } - public static void split(String inputfolder, String xmlfile, String outputFolder, String condition, int nbElementsByFile) throws XMLStreamException, IOException { - - FileSystemImpl.createDirectoryIfNotExist(Paths.get(outputFolder)); + public static void split(String inputfolder, String xmlfile, String outputFolder, String condition, int nbElementsByFile, FileUtilsInterface fileUtilsInterface) throws XMLStreamException, IOException, KraftwerkException { String xmlResource = inputfolder + xmlfile; - List header = getHeader(xmlResource, condition); + List header = getHeader(xmlResource, condition, fileUtilsInterface); XMLEventFactory xef = XMLEventFactory.newFactory(); XMLInputFactory xif = XMLInputFactory.newInstance(); xif.setProperty(XMLInputFactory.SUPPORT_DTD, false); xif.setProperty(XMLInputFactory.IS_SUPPORTING_EXTERNAL_ENTITIES, false); - XMLEventReader xer = xif.createXMLEventReader(new FileReader(xmlResource)); - StartElement rootStartElement = xer.nextTag().asStartElement(); - StartDocument startDocument = xef.createStartDocument(); - EndDocument endDocument = xef.createEndDocument(); - - XMLOutputFactory xof = XMLOutputFactory.newFactory(); - int fileCount = 1; - while(xer.hasNext() && !xer.peek().isEndDocument()) { - XMLEvent xmlEvent = xer.nextEvent(); - - if (isStartElementWithName(condition, xmlEvent)) { - // Create a file for the fragment, the name is derived from the value of the id attribute - FileWriter fileWriter = new FileWriter(outputFolder + "split" + fileCount + ".xml"); - - // A StAX XMLEventWriter will be used to write the XML fragment - XMLEventWriter xew = xof.createXMLEventWriter(fileWriter); - xew.add(startDocument); - // Add the elements which are common to all split files - addHeadersToNewFile(header, xew); + try (InputStream inputStream = fileUtilsInterface.readFile(xmlResource)) { + XMLEventReader xer = xif.createXMLEventReader(inputStream); + StartElement rootStartElement = xer.nextTag().asStartElement(); + StartDocument startDocument = xef.createStartDocument(); + EndDocument endDocument = xef.createEndDocument(); - // Write the XMLEvents that are part of SurveyUnit element - xew.add(xmlEvent); - xmlEvent = xer.nextEvent(); - int nbResponses = 1; - // We loop until we reach the end tag Survey units indicating the near end of the document - iterateOnSurveyUnits(condition, nbElementsByFile, xer, xmlEvent, xew, nbResponses); - - // Write the file, close everything we opened and update the file's counter - xew.add(xef.createEndElement(rootStartElement.getName(), null)); - xew.add(endDocument); - fileWriter.close(); - - fileCount++; + XMLOutputFactory xof = XMLOutputFactory.newFactory(); + int fileCount = 1; + while (xer.hasNext() && !xer.peek().isEndDocument()) { + XMLEvent xmlEvent = xer.nextEvent(); + if (isStartElementWithName(condition, xmlEvent)) { + // Create a temp file for the fragment, the name is derived from the value of the id attribute + String tempFileName = "split" + fileCount; + File tempFile = File.createTempFile(outputFolder + tempFileName,null); + FileWriter fileWriter = new FileWriter(tempFile); + + // A StAX XMLEventWriter will be used to write the XML fragment + XMLEventWriter xew = xof.createXMLEventWriter(fileWriter); + xew.add(startDocument); + + // Add the elements which are common to all split files + addHeadersToNewFile(header, xew); + + // Write the XMLEvents that are part of SurveyUnit element + xew.add(xmlEvent); + xmlEvent = xer.nextEvent(); + int nbResponses = 1; + // We loop until we reach the end tag Survey units indicating the near end of the document + iterateOnSurveyUnits(condition, nbElementsByFile, xer, xmlEvent, xew, nbResponses); + + // Write the file, close everything we opened and + xew.add(xef.createEndElement(rootStartElement.getName(), null)); + xew.add(endDocument); + fileWriter.close(); + + //Move to outputFolder + fileUtilsInterface.moveFile(tempFile.getAbsolutePath(), outputFolder + "/" + tempFileName + ".xml"); + + //Update the file's counter + fileCount++; + } } } } @@ -102,32 +107,34 @@ private static boolean isEndElementWithName(XMLEvent xmlEvent, String condition) return xmlEvent.isEndElement() && xmlEvent.asEndElement().getName().getLocalPart().equals(condition); } - private static List getHeader(String xmlResource, String condition) throws FileNotFoundException, XMLStreamException { - XMLInputFactory xif = XMLInputFactory.newInstance(); - xif.setProperty(XMLInputFactory.SUPPORT_DTD, false); - xif.setProperty(XMLInputFactory.IS_SUPPORTING_EXTERNAL_ENTITIES, false); - XMLEventReader xer = xif.createXMLEventReader(new FileReader(xmlResource)); - - List cachedXMLEvents = new ArrayList<>(); - while(xer.hasNext() && !xer.peek().isEndDocument()) { - XMLEvent xmlEvent = xer.nextTag(); - if (!xmlEvent.isStartElement()) { - break; - } - StartElement breakStartElement = xmlEvent.asStartElement(); - - cachedXMLEvents.add(breakStartElement); - xmlEvent = xer.nextEvent(); - while (!(xmlEvent.isEndElement() && xmlEvent.asEndElement().getName().equals(breakStartElement.getName()))) { - if (isStartElementWithName(condition, xmlEvent)) { - xer.close(); - return cachedXMLEvents; + private static List getHeader(String xmlResource, String condition, FileUtilsInterface fileUtilsInterface) throws IOException, XMLStreamException { + try(InputStream inputStream = fileUtilsInterface.readFile(xmlResource)) { + XMLInputFactory xif = XMLInputFactory.newInstance(); + xif.setProperty(XMLInputFactory.SUPPORT_DTD, false); + xif.setProperty(XMLInputFactory.IS_SUPPORTING_EXTERNAL_ENTITIES, false); + XMLEventReader xer = xif.createXMLEventReader(inputStream); + + List cachedXMLEvents = new ArrayList<>(); + while (xer.hasNext() && !xer.peek().isEndDocument()) { + XMLEvent xmlEvent = xer.nextTag(); + if (!xmlEvent.isStartElement()) { + break; } - cachedXMLEvents.add(xmlEvent); + StartElement breakStartElement = xmlEvent.asStartElement(); + + cachedXMLEvents.add(breakStartElement); xmlEvent = xer.nextEvent(); + while (!(xmlEvent.isEndElement() && xmlEvent.asEndElement().getName().equals(breakStartElement.getName()))) { + if (isStartElementWithName(condition, xmlEvent)) { + xer.close(); + return cachedXMLEvents; + } + cachedXMLEvents.add(xmlEvent); + xmlEvent = xer.nextEvent(); + } } + xer.close(); } - xer.close(); return List.of(); } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java index bc530286..57fa468c 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java @@ -2,6 +2,7 @@ import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileSystemType; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.xml.XmlSplitter; import org.junit.jupiter.api.BeforeAll; @@ -43,7 +44,7 @@ static void cleanUpBeforeTests() throws Exception { } } XmlSplitter.split(TestConstants.UNIT_TESTS_DIRECTORY+"/data/lunatic_xml/", "fake-lunatic-data-1.xml", - outDirectory,"SurveyUnit",2); + outDirectory,"SurveyUnit",2, new FileSystemImpl()); } @Test From acad2b79d082cb73e729a346d00579c622b72beb Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 24 Jun 2024 10:29:35 +0200 Subject: [PATCH 21/46] Refactos and interface reorder --- .../kraftwerk/api/services/MainService.java | 19 ++- .../api/services/StepByStepService.java | 32 ++--- .../kraftwerk/core/parsers/DataParser.java | 1 - .../BuildBindingsSequenceGenesis.java | 2 +- .../insee/kraftwerk/core/utils/CsvUtils.java | 1 - .../core/utils/files/FileSystemImpl.java | 6 +- .../core/utils/files/FileUtilsInterface.java | 115 +++++++++++------- .../kraftwerk/core/utils/files/MinioImpl.java | 14 ++- .../kraftwerk/core/utils/XmlSplitterTest.java | 7 +- 9 files changed, 118 insertions(+), 79 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java index 78b2a8ea..3eff6461 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java @@ -14,6 +14,7 @@ import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.Parameter; import io.swagger.v3.oas.annotations.tags.Tag; +import lombok.extern.slf4j.Slf4j; import org.springframework.beans.factory.annotation.Autowired; import org.springframework.http.HttpStatus; import org.springframework.http.ResponseEntity; @@ -26,19 +27,27 @@ @RestController +@Slf4j @Tag(name = "${tag.main}") public class MainService extends KraftwerkService { ConfigProperties configProperties; MinioClient minioClient; + boolean useMinio; + @Autowired public MainService(ConfigProperties configProperties, MinioConfig minioConfig) { super(minioConfig); this.configProperties = configProperties; this.minioConfig = minioConfig; - if(minioConfig.isEnable()){ + useMinio = false; + if(minioConfig == null){ + log.warn("Minio config null !"); + } + if(minioConfig != null && minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); + useMinio = true; } } @@ -52,7 +61,7 @@ public ResponseEntity mainService( boolean fileByFile = false; boolean withDDI = true; FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -81,7 +90,7 @@ public ResponseEntity mainFileByFile( boolean withAllReportingData = false; boolean withDDI = true; FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -109,7 +118,7 @@ public ResponseEntity mainLunaticOnly( boolean fileByFile = false; boolean withAllReportingData = false; FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -132,7 +141,7 @@ public ResponseEntity mainLunaticOnly( public ResponseEntity mainGenesis( @Parameter(description = "${param.idCampaign}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String idCampaign) { FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java index 39fa9c98..db707c34 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java @@ -19,6 +19,7 @@ import io.swagger.v3.oas.annotations.Operation; import io.swagger.v3.oas.annotations.Parameter; import io.swagger.v3.oas.annotations.tags.Tag; +import lombok.extern.slf4j.Slf4j; import org.springframework.beans.factory.annotation.Autowired; import org.springframework.http.ResponseEntity; import org.springframework.web.bind.annotation.*; @@ -37,17 +38,23 @@ @RestController @Tag(name = "${tag.stepbystep}") +@Slf4j public class StepByStepService extends KraftwerkService { MinioClient minioClient; + boolean useMinio; @Autowired public StepByStepService(MinioConfig minioConfig) { super(minioConfig); - //TODO warn if enable null - if(minioConfig.isEnable()){ + useMinio = false; + if(minioConfig == null){ + log.warn("Minio config null !"); + } + if(minioConfig != null && minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); + useMinio = true; } - } + } @PutMapping(value = "/buildVtlBindings") @Operation(operationId = "buildVtlBindings", summary = "${summary.buildVtlBindings}", description = "${description.buildVtlBindings}") @@ -59,7 +66,7 @@ public ResponseEntity buildVtlBindings( boolean fileByFile = false; boolean withDDI = true; FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -103,7 +110,7 @@ public ResponseEntity buildVtlBindingsByDataMode( boolean fileByFile = false; boolean withDDI = true; FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -140,7 +147,7 @@ public ResponseEntity unimodalProcessing( @Parameter(description = "${param.dataMode}", required = true) @RequestParam String dataMode ) { FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -188,7 +195,7 @@ public ResponseEntity multimodalProcessing( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam ) { FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -245,7 +252,7 @@ public ResponseEntity writeOutputFiles( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam ) throws KraftwerkException, SQLException { FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -262,7 +269,7 @@ public ResponseEntity writeOutputFiles( List errors = new ArrayList<>(); // Read all bindings necessary to produce output String path = FileUtilsInterface.transformToTemp(inDirectory).toString(); - List fileNames = fileUtilsInterface.listFiles(path); + List fileNames = fileUtilsInterface.listFileNames(path); fileNames = fileNames.stream().filter(name -> name.endsWith(StepEnum.MULTIMODAL_PROCESSING.getStepLabel()+JSON)).toList(); for (String name : fileNames){ String pathBindings = path + File.separator + name; @@ -291,7 +298,7 @@ public ResponseEntity writeOutputFiles( public ResponseEntity archiveService( @Parameter(description = "${param.inDirectory}", required = true, example = INDIRECTORY_EXAMPLE) @RequestBody String inDirectoryParam) { FileUtilsInterface fileUtilsInterface; - if(Boolean.TRUE.equals(minioConfig.isEnable())){ + if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); }else{ fileUtilsInterface = new FileSystemImpl(); @@ -299,9 +306,4 @@ public ResponseEntity archiveService( return archive(inDirectoryParam, fileUtilsInterface); } - - - - - } \ No newline at end of file diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java index 214f35ca..9eb1ee11 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/DataParser.java @@ -13,7 +13,6 @@ */ @Log4j2 public abstract class DataParser { - //TODO replace Path objects to String public static final String DATAPATH_IS_NULL = "Datapath is null"; protected final SurveyRawData data; protected final FileUtilsInterface fileUtilsInterface; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java index f75e127e..7365372d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java @@ -94,7 +94,7 @@ private void parseParadata(String dataMode, SurveyRawData data, Path inDirectory private void parseReportingData(String dataMode, SurveyRawData data, Path inDirectory, FileUtilsInterface fileUtilsInterface) throws KraftwerkException, NullException { Path reportingDataFile = inDirectory.resolve(dataMode+Constants.REPORTING_DATA_FOLDER); if (fileUtilsInterface.isFileExists(reportingDataFile.toString())) { - List listFiles = fileUtilsInterface.listFiles(reportingDataFile.toString()); + List listFiles = fileUtilsInterface.listFileNames(reportingDataFile.toString()); for (String file : listFiles) { ReportingData reportingData = new ReportingData(reportingDataFile.resolve(file)); if (file.contains(".xml")) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java index 12e220de..7a414b88 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/CsvUtils.java @@ -17,7 +17,6 @@ /** Encapsulate org.opencsv features that we use in Kraftwerk. */ public class CsvUtils { - //TODO make it work with Minio private CsvUtils() { //Utility class } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 7144a60a..846811b5 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -34,9 +34,7 @@ public class FileSystemImpl implements FileUtilsInterface{ - /** - * Move the input file to another directory to archive it - */ + @Override public void renameInputFile(Path inDirectory) { File file = inDirectory.resolve("kraftwerk.json").toFile(); @@ -89,7 +87,7 @@ public void deleteDirectory(Path directoryPath) throws KraftwerkException { * @return */ @Override - public List listFiles(String dir) { + public List listFileNames(String dir) { File dirFile = new File(dir); return Stream.of(new File(dir).listFiles()) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index b1663db6..eb3acbcd 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -13,8 +13,11 @@ import java.time.format.DateTimeFormatter; import java.util.List; +/** + * Interface to use to interact with storage + */ public interface FileUtilsInterface { - //TODO organize this + //Common methods static Path transformToOut(Path inDirectory) { return transformToOther(inDirectory, "out"); } @@ -38,71 +41,97 @@ private static Path transformToOther(Path inDirectory, String other) { : transformToOther(inDirectory.getParent(), other).resolve(inDirectory.getFileName()); } - void renameInputFile(Path inDirectory); - - void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException; - - void deleteDirectory(Path directoryPath) throws KraftwerkException; - - //TODO change to listFilesNames - List listFiles(String dir); - - List listFilePaths(String dir); - - Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset); - - Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; - - URL convertToUrl(String userField, Path inputDirectory); - + //Methods to implement + //File system interactions /** - * + * Read a file * @param path path of file - * @return true if directory, false if file, null if neither + * @return an InputStream of content of file */ - @Nullable - Boolean isDirectory(String path); - - /** - * - * @param path path of file - * @return size of file - */ - long getSizeOf(String path); - + InputStream readFile(String path); /** - * Write a file in the path + * Write string into a file * @param path path of the file * @param toWrite String to write * @param replace true if overwrite, false if append */ void writeFile(String path, String toWrite, boolean replace); + /** + * Move file from source to destination (depends on the file system) + * @param srcPath source path + * @param dstPath destination path + * @throws KraftwerkException + */ + void moveFile(String srcPath, String dstPath) throws KraftwerkException; + /** + * Move file from local file system to another path + * @param fileSystemPath local path + * @param dstPath destination path + * @throws KraftwerkException + */ + void moveFile(Path fileSystemPath, String dstPath) throws KraftwerkException; + /** + * Deletes a directory recursively + * @param directoryPath path of directory + * @throws KraftwerkException if exception + */ + void deleteDirectory(Path directoryPath) throws KraftwerkException; /** * Find the file in the folder of a campaign * @param directory directory where the file should be * @param fileRegex regex of the file to match - * @return Path of the DDI file + * @return Path of the file * @throws KraftwerkException if no file found */ String findFile(String directory, String fileRegex) throws KraftwerkException; - InputStream readFile(String path); + //File listing + /** + * List file names in a directory + * @param dir directory to list files from + * @return a list of file names + */ + List listFileNames(String dir); + + /** + * List file paths in a directory + * @param dir directory to list files from + * @return a list of file paths + */ + List listFilePaths(String dir); + + //Conversions + Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; + URL convertToUrl(String userField, Path inputDirectory); + + //Checks + /** + * Check if file exists + * @param path path of file + * @return true if file exists, false otherwise + */ boolean isFileExists(String path); + /** + * Checks if path is a file or directory or neither + * @param path path of file + * @return true if directory, false if file, null if neither + */ + @Nullable + Boolean isDirectory(String path); /** - * Move file from source to destination (depends of the file system) - * @param srcPath source path - * @param dstPath destination path - * @throws KraftwerkException + * Returns the size of a file + * @param path path of file + * @return size of file */ - void moveFile(String srcPath, String dstPath) throws KraftwerkException; + long getSizeOf(String path); + //Misc. /** - * Move file from local file system to another path - * @param fileSystemPath local path - * @param dstPath destination path - * @throws KraftwerkException + * Move the input file to another directory to archive it */ - void moveFile(Path fileSystemPath, String dstPath) throws KraftwerkException; + void renameInputFile(Path inDirectory); + void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkException; + Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index 11c21032..bf444247 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -32,6 +32,7 @@ import java.util.ArrayList; import java.util.Arrays; import java.util.List; +import java.util.stream.Stream; @Slf4j @AllArgsConstructor @@ -80,7 +81,7 @@ public void archiveInputFiles(UserInputsFile userInputsFile) throws KraftwerkExc @Override public void deleteDirectory(Path directoryPath) throws KraftwerkException { try { - for (String filePath : listFiles(directoryPath.toString())) { + for (String filePath : listFileNames(directoryPath.toString())) { deleteFile(filePath); } } catch (Exception e) { @@ -89,7 +90,7 @@ public void deleteDirectory(Path directoryPath) throws KraftwerkException { } @Override - public List listFiles(String dir) { + public List listFileNames(String dir) { try { ArrayList filePaths = new ArrayList<>(); Iterable> results = minioClient.listObjects( @@ -107,7 +108,7 @@ public List listFiles(String dir) { @Override public List listFilePaths(String dir) { - return listFiles(dir); + return listFileNames(dir); } @Override @@ -180,7 +181,10 @@ public void writeFile(String path, String toWrite, boolean replace) { @Override public String findFile(String directory, String fileRegex) throws KraftwerkException { - return null; //TODO faire ça + try (Stream files = listFileNames(directory).stream().filter(s -> s.matches(fileRegex))) { + return files.findFirst() + .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + directory)); + } } @Override @@ -251,7 +255,7 @@ private void copyFile(String srcMinioPath, String dstMinioPath) { private void moveDirectory(String srcMinioPath, String dstMinioPath) { try { - for (String filePath : listFiles(srcMinioPath)) { + for (String filePath : listFileNames(srcMinioPath)) { moveFile(filePath, dstMinioPath + "/" + extractFileName(filePath)); } } catch (Exception e) { diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java index 57fa468c..484b5e96 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/XmlSplitterTest.java @@ -2,7 +2,6 @@ import fr.insee.kraftwerk.core.TestConstants; import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.files.FileSystemType; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.utils.xml.XmlSplitter; import org.junit.jupiter.api.BeforeAll; @@ -34,7 +33,7 @@ class XmlSplitterTest { static void cleanUpBeforeTests() throws Exception { File file = new File(outDirectory); if (file.exists()) { - List splitFiles = fileUtilsInterface.listFiles(outDirectory); + List splitFiles = fileUtilsInterface.listFileNames(outDirectory); if (splitFiles != null){ for (String splitFile : splitFiles) { if(!Files.deleteIfExists(Paths.get(outDirectory+splitFile))){ @@ -50,14 +49,14 @@ static void cleanUpBeforeTests() throws Exception { @Test @DisplayName("OutDirectory should contain 3 files") void splitInThreeTest() throws XMLStreamException, IOException { - List splitFiles = fileUtilsInterface.listFiles(outDirectory); + List splitFiles = fileUtilsInterface.listFileNames(outDirectory); assertEquals(3,splitFiles.size()); } @Test @DisplayName("File split1.xml file should contain 2 survey units") void contains2SuTest() throws XMLStreamException, IOException { - List splitFiles = fileUtilsInterface.listFiles(outDirectory); + List splitFiles = fileUtilsInterface.listFileNames(outDirectory); int count = 0; XMLInputFactory factory = XMLInputFactory.newInstance(); try { From 8a18b4d9da27b37749325000f94c4a488ed77a8c Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 24 Jun 2024 10:33:33 +0200 Subject: [PATCH 22/46] Update CHANGELOG.md --- CHANGELOG.md | 8 ++++++-- 1 file changed, 6 insertions(+), 2 deletions(-) diff --git a/CHANGELOG.md b/CHANGELOG.md index 5d592072..fbe44696 100644 --- a/CHANGELOG.md +++ b/CHANGELOG.md @@ -1,6 +1,10 @@ # Changelog -## 2.2.0 [TODO] - DuckDB implementation for output +## 3.0.0 [TODO] - Kubernetes support ### Added +- Launch treatment with command line +- S3/MinIO support : All file system calls goes through an interface with both OS file system and MinIO implementations + +- DuckDB implementation for output - Transfer Vtl datasets into DuckDB before output step - SQL util class for SQL operations @@ -10,7 +14,7 @@ ### Removed - Avro -- + ## 2.1.0 [2024-06-11] - Change Lunatic reader ### Changed - Refactor of Lunatic reader From f6e88bb091545325d9bba287b28f36c7a2e95c65 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 24 Jun 2024 11:30:52 +0200 Subject: [PATCH 23/46] Begin file interface and implementations tests --- .../core/utils/files/FileSystemImpl.java | 7 - .../core/inputs/UserInputsFileTest.java | 2 +- .../sequence/BuildBindingsSequenceTest.java | 4 +- .../core/utils/FileSystemImplTest.java | 105 ------------- .../core/utils/files/FileSystemImplTest.java | 148 ++++++++++++++++++ .../utils/files/FileSystemInterfaceTest.java | 24 +++ .../core/utils/files/MinioImplTest.java | 4 + .../unit_tests/files/list_files/file1.txt | 0 .../unit_tests/files/list_files/file2.json | 0 .../unit_tests/files/list_files/file3.xml | 0 .../files/move_files/move_files.json | 34 ++++ .../files/rename_files/kraftwerk.json | 24 +++ .../unit_tests/move_files/move_files.json | 34 ---- 13 files changed, 237 insertions(+), 149 deletions(-) delete mode 100644 kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java create mode 100644 kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java create mode 100644 kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java create mode 100644 kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java create mode 100644 kraftwerk-core/src/test/resources/unit_tests/files/list_files/file1.txt create mode 100644 kraftwerk-core/src/test/resources/unit_tests/files/list_files/file2.json create mode 100644 kraftwerk-core/src/test/resources/unit_tests/files/list_files/file3.xml create mode 100644 kraftwerk-core/src/test/resources/unit_tests/files/move_files/move_files.json create mode 100644 kraftwerk-core/src/test/resources/unit_tests/files/rename_files/kraftwerk.json delete mode 100644 kraftwerk-core/src/test/resources/unit_tests/move_files/move_files.json diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 846811b5..ce8463d6 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -81,15 +81,8 @@ public void deleteDirectory(Path directoryPath) throws KraftwerkException { } } - /** - * List the file names in the directory - * @param dir - * @return - */ @Override public List listFileNames(String dir) { - File dirFile = new File(dir); - return Stream.of(new File(dir).listFiles()) .filter(file -> !file.isDirectory()) .map(File::getName) diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java index 1d4e4811..3a21e572 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java @@ -29,7 +29,7 @@ class UserInputsFileTest { @Test void testReadValidUserInput_singleMode() throws KraftwerkException { UserInputsFile userInputsFile = new UserInputsFile( - inputSamplesDirectory.resolve("inputs_valid.json"), + inputSamplesDirectory.resolve("kraftwerk.json"), inputSamplesDirectory, fileUtilsInterface); // ModeInputs modeInputs = userInputsFile.getModeInputs("CAPI"); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java index d17b2a03..e1b58487 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java @@ -30,7 +30,7 @@ class BuildBindingsSequenceTest { void buildVtlBindings_errorWithoutMetadata() throws KraftwerkException { //GIVEN UserInputsFile userInputsFile = new UserInputsFile( - inputSamplesDirectory.resolve("inputs_valid.json"), + inputSamplesDirectory.resolve("kraftwerk.json"), inputSamplesDirectory, fileUtilsInterface); String dataMode = "CAPI"; VtlBindings vtlBindings = new VtlBindings(); @@ -50,7 +50,7 @@ void buildVtlBindings_errorWithoutMetadata() throws KraftwerkException { void buildVtlBindings_success_changingDdi_and_reportingData(boolean withDdi, boolean withAllReportingData ) throws KraftwerkException { //GIVEN UserInputsFile userInputsFile = new UserInputsFile( - inputSamplesDirectory.resolve("inputs_valid.json"), + inputSamplesDirectory.resolve("kraftwerk.json"), inputSamplesDirectory, fileUtilsInterface); String dataMode = "CAPI"; VtlBindings vtlBindings = new VtlBindings(); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java deleted file mode 100644 index baee18ad..00000000 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/FileSystemImplTest.java +++ /dev/null @@ -1,105 +0,0 @@ -package fr.insee.kraftwerk.core.utils; - -import fr.insee.kraftwerk.core.Constants; -import fr.insee.kraftwerk.core.TestConstants; -import fr.insee.kraftwerk.core.exceptions.KraftwerkException; -import fr.insee.kraftwerk.core.inputs.UserInputsFile; -import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; -import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; -import org.junit.jupiter.api.Assertions; -import org.junit.jupiter.api.BeforeAll; -import org.junit.jupiter.api.Test; - -import java.io.File; -import java.io.IOException; -import java.nio.file.Files; -import java.nio.file.Path; -import java.nio.file.Paths; -import java.time.LocalDateTime; - -import static org.junit.Assert.assertThrows; -import static org.junit.jupiter.api.Assertions.assertEquals; - -class FileSystemImplTest { - private static FileUtilsInterface fileUtilsInterface; - - @BeforeAll - static void init(){ - fileUtilsInterface = new FileSystemImpl(); - } - - - @Test - void testTransformToOut() { - assertEquals(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/out/VQS"), - FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"))); - } - - @Test - void testTransformToOut2() { - Path path = Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/out/VQS"); - assertEquals(path, FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"), LocalDateTime.now()).getParent()); - } - - @Test - void archiveInputFiles_failWhenNull() { - assertThrows(NullPointerException.class, () -> fileUtilsInterface.archiveInputFiles(null)); - } - - - @Test - void archiveInputFiles_ok() throws IOException, KraftwerkException{ - - //GIVEN - String campaignName = "move_files"; - Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, campaignName, "execute"); - org.springframework.util.FileSystemUtils.deleteRecursively(inputDirectory); - Files.createDirectories(inputDirectory); - Files.copy(Path.of(TestConstants.UNIT_TESTS_DIRECTORY, campaignName,"move_files.json"), - Path.of(inputDirectory.toString(),"move_files.json")); - - //WEB - Path webDirectory = Paths.get(inputDirectory.toString(), "web"); - Files.createDirectories(webDirectory); - new File(webDirectory+"/web.xml").createNewFile(); - new File(webDirectory+"/vqs-2021-x00-xforms-ddi.xml").createNewFile(); - new File(webDirectory+"/WEB.vtl").createNewFile(); - - //PAPER - Path paperDirectory = Paths.get(inputDirectory.toString(), "papier"); - Files.createDirectories(paperDirectory); - new File(paperDirectory+"/paper.txt").createNewFile(); - new File(paperDirectory+"/vqs-2021-x00-fo-ddi.xml").createNewFile(); - - //Reporting - Path reportingDirectory = Paths.get(inputDirectory.toString(), "suivi"); - Files.createDirectories(reportingDirectory); - new File(reportingDirectory+"/reportingdata.xml").createNewFile(); - - //Paradata - Path paradataDirectory = Paths.get(inputDirectory.toString(), "paradata"); - Files.createDirectories(paradataDirectory); - new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000003.json")).createNewFile(); - new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000004.json")).createNewFile(); - new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000009.json")).createNewFile(); - new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000010.json")).createNewFile(); - - UserInputsFile testUserInputsFile = new UserInputsFile(Path.of(inputDirectory.toString(), "move_files.json"),inputDirectory, fileUtilsInterface); - - - //WHEN - fileUtilsInterface.archiveInputFiles(testUserInputsFile); - - //THEN - Assertions.assertTrue(new File(inputDirectory.toString() + "/Archive/papier").exists()); - Assertions.assertTrue(new File(inputDirectory.toString() + "/Archive/web").exists()); - Assertions.assertTrue(new File(inputDirectory.toString() + "/Archive/paradata/L0000010.json").exists()); - Assertions.assertTrue(new File(inputDirectory.toString() + "/Archive/suivi/reportingdata.xml").exists()); - - //CLEAN - org.springframework.util.FileSystemUtils.deleteRecursively(inputDirectory); - } - - -} - diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java new file mode 100644 index 00000000..a93ec89c --- /dev/null +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java @@ -0,0 +1,148 @@ +package fr.insee.kraftwerk.core.utils.files; + +import fr.insee.kraftwerk.core.Constants; +import fr.insee.kraftwerk.core.TestConstants; +import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import fr.insee.kraftwerk.core.inputs.UserInputsFile; +import org.assertj.core.api.Assertions; +import org.junit.jupiter.api.Test; + +import java.io.File; +import java.io.IOException; +import java.nio.file.Files; +import java.nio.file.Path; +import java.nio.file.Paths; +import java.util.List; +import java.util.stream.Stream; + +import static org.junit.Assert.assertThrows; + +class FileSystemImplTest { + private static final FileSystemImpl fileSystemImpl = new FileSystemImpl(); + + @Test + void renameInputFileTest() throws IOException { + + //GIVEN + String campaignName = "rename_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY,"files", campaignName); + //backup + Files.copy(inputDirectory.resolve("kraftwerk.json"), inputDirectory.getParent().resolve("kraftwerk.json")); + + //WHEN + fileSystemImpl.renameInputFile(inputDirectory); + + //THEN + try(Stream stream = Files.list(inputDirectory).filter(path -> path.getFileName().toString().startsWith("kraftwerk-"))){ + Assertions.assertThat(stream).isNotEmpty(); + } + + //CLEAN + org.springframework.util.FileSystemUtils.deleteRecursively(inputDirectory); + Files.createDirectories(inputDirectory); + Files.move(Path.of(inputDirectory.getParent().toString(),"kraftwerk.json"),Path.of(inputDirectory.toString(),"kraftwerk.json")); + } + + @Test + void archiveInputFiles_failWhenNull() { + assertThrows(NullPointerException.class, () -> fileSystemImpl.archiveInputFiles(null)); + } + + @Test + void archiveInputFiles_ok() throws IOException, KraftwerkException { + + //GIVEN + String campaignName = "move_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + //backup + Files.copy(Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName,"move_files.json"), + Path.of(inputDirectory.getParent().toString(),"move_files.json")); + + //WEB + Path webDirectory = Paths.get(inputDirectory.toString(), "web"); + Files.createDirectories(webDirectory); + new File(webDirectory+"/web.xml").createNewFile(); + new File(webDirectory+"/vqs-2021-x00-xforms-ddi.xml").createNewFile(); + new File(webDirectory+"/WEB.vtl").createNewFile(); + + //PAPER + Path paperDirectory = Paths.get(inputDirectory.toString(), "papier"); + Files.createDirectories(paperDirectory); + new File(paperDirectory+"/paper.txt").createNewFile(); + new File(paperDirectory+"/vqs-2021-x00-fo-ddi.xml").createNewFile(); + + //Reporting + Path reportingDirectory = Paths.get(inputDirectory.toString(), "suivi"); + Files.createDirectories(reportingDirectory); + new File(reportingDirectory+"/reportingdata.xml").createNewFile(); + + //Paradata + Path paradataDirectory = Paths.get(inputDirectory.toString(), "paradata"); + Files.createDirectories(paradataDirectory); + new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000003.json")).createNewFile(); + new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000004.json")).createNewFile(); + new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000009.json")).createNewFile(); + new File(Constants.getResourceAbsolutePath(paradataDirectory +"/L0000010.json")).createNewFile(); + + UserInputsFile testUserInputsFile = new UserInputsFile(Path.of(inputDirectory.toString(), "move_files.json"),inputDirectory, fileSystemImpl); + + + //WHEN + fileSystemImpl.archiveInputFiles(testUserInputsFile); + + //THEN + Assertions.assertThat(new File(inputDirectory + "/Archive/papier")).exists(); + Assertions.assertThat(new File(inputDirectory + "/Archive/web")).exists(); + Assertions.assertThat(new File(inputDirectory + "/Archive/paradata/L0000010.json")).exists(); + Assertions.assertThat(new File(inputDirectory + "/Archive/suivi/reportingdata.xml")).exists(); + + //CLEAN + org.springframework.util.FileSystemUtils.deleteRecursively(inputDirectory); + Files.createDirectories(inputDirectory); + Files.move(Path.of(inputDirectory.getParent().toString(),"move_files.json"),Path.of(inputDirectory.toString(),"move_files.json")); + } + + @Test + void deleteDirectoryTest() throws KraftwerkException, IOException { + //GIVEN + String campaignName = "delete_directory"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + Files.createDirectories(inputDirectory); + Files.createFile(inputDirectory.resolve("test.txt")); + + //WHEN + fileSystemImpl.deleteDirectory(inputDirectory); + + //THEN + Assertions.assertThat(new File(inputDirectory.toString())).doesNotExist(); + } + + @Test + void listFileNamesTest(){ + //GIVEN + String campaignName = "list_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + List fileNames = fileSystemImpl.listFileNames(inputDirectory.toString()); + + //THEN + Assertions.assertThat(fileNames).containsExactly("file1.txt","file2.json","file3.xml"); + } + + @Test + void listFilePathsTest() { + //GIVEN + String campaignName = "list_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + List filePaths = fileSystemImpl.listFilePaths(inputDirectory.toString()); + + //THEN + Assertions.assertThat(filePaths).hasSize(3); + for (String filePath : filePaths) { + Assertions.assertThat(Path.of(filePath).getFileName().toString()).containsAnyOf("file1.txt", "file2.json", "file3.xml"); + } + } +} diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java new file mode 100644 index 00000000..ad917b7a --- /dev/null +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java @@ -0,0 +1,24 @@ +package fr.insee.kraftwerk.core.utils.files; + +import org.junit.jupiter.api.Test; + +import java.nio.file.Path; +import java.nio.file.Paths; +import java.time.LocalDateTime; + +import static org.junit.jupiter.api.Assertions.assertEquals; + +class FileSystemInterfaceTest { + @Test + void testTransformToOut() { + assertEquals(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/out/VQS"), + FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"))); + } + + @Test + void testTransformToOut2() { + Path path = Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/out/VQS"); + assertEquals(path, FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"), LocalDateTime.now()).getParent()); + } +} + diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java new file mode 100644 index 00000000..70aa5fd4 --- /dev/null +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java @@ -0,0 +1,4 @@ +package fr.insee.kraftwerk.core.utils.files; + +public class MinioImplTest { +} diff --git a/kraftwerk-core/src/test/resources/unit_tests/files/list_files/file1.txt b/kraftwerk-core/src/test/resources/unit_tests/files/list_files/file1.txt new file mode 100644 index 00000000..e69de29b diff --git a/kraftwerk-core/src/test/resources/unit_tests/files/list_files/file2.json b/kraftwerk-core/src/test/resources/unit_tests/files/list_files/file2.json new file mode 100644 index 00000000..e69de29b diff --git a/kraftwerk-core/src/test/resources/unit_tests/files/list_files/file3.xml b/kraftwerk-core/src/test/resources/unit_tests/files/list_files/file3.xml new file mode 100644 index 00000000..e69de29b diff --git a/kraftwerk-core/src/test/resources/unit_tests/files/move_files/move_files.json b/kraftwerk-core/src/test/resources/unit_tests/files/move_files/move_files.json new file mode 100644 index 00000000..cbfa8755 --- /dev/null +++ b/kraftwerk-core/src/test/resources/unit_tests/files/move_files/move_files.json @@ -0,0 +1,34 @@ +{ + + "campaign": "Differential", + + "survey_data": [ + { + "data_mode": "WEB", + "data_file": "web/web.xml", + "DDI_file": "web/vqs-2021-x00-xforms-ddi.xml", + "data_format": "XFORMS", + "paradata_folder": "paradata", + "reporting_data_file": "suivi/reportingdata.xml", + "mode_specifications": "web/WEB.vtl" + }, + { + "data_mode": "PAPER", + "data_file": "papier/paper.txt", + "DDI_file": "papier/vqs-2021-x00-fo-ddi.xml", + "data_format": "PAPER", + "paradata_folder": "", + "reporting_data_file": "", + "mode_specifications": "" + } + ], + + "multimode_dataset_name": "MULTIMODE", + + "reconciliation_specifications": "", + + "transformation_specifications": "", + + "information_levels_specifications": "" + +} \ No newline at end of file diff --git a/kraftwerk-core/src/test/resources/unit_tests/files/rename_files/kraftwerk.json b/kraftwerk-core/src/test/resources/unit_tests/files/rename_files/kraftwerk.json new file mode 100644 index 00000000..802eca67 --- /dev/null +++ b/kraftwerk-core/src/test/resources/unit_tests/files/rename_files/kraftwerk.json @@ -0,0 +1,24 @@ +{ + + "survey_data": [ + { + "data_mode": "CAPI", + "data_file": "sample_files_to_get/data.xml", + "DDI_file": "sample_files_to_get/ddi.xml", + "data_format": "LUNATIC_XML", + "lunatic_file": "sample_files_to_get/lunatic.json", + "paradata_folder": "", + "reporting_data_file": "sample_files_to_get/reportingdata.xml", + "mode_specifications": "" + } + ], + + "multimode_dataset_name": "MULTIMODE", + + "reconciliation_specifications": "", + + "transformation_specifications": "", + + "information_levels_specifications": "" + +} diff --git a/kraftwerk-core/src/test/resources/unit_tests/move_files/move_files.json b/kraftwerk-core/src/test/resources/unit_tests/move_files/move_files.json deleted file mode 100644 index c1d5cbbc..00000000 --- a/kraftwerk-core/src/test/resources/unit_tests/move_files/move_files.json +++ /dev/null @@ -1,34 +0,0 @@ -{ - - "campaign": "Differential", - - "survey_data": [ - { - "data_mode": "WEB", - "data_file": "web/web.xml", - "DDI_file": "web/vqs-2021-x00-xforms-ddi.xml", - "data_format": "XFORMS", - "paradata_folder": "paradata", - "reporting_data_file": "suivi/reportingdata.xml", - "mode_specifications": "web/WEB.vtl" - }, - { - "data_mode": "PAPER", - "data_file": "papier/paper.txt", - "DDI_file": "papier/vqs-2021-x00-fo-ddi.xml", - "data_format": "PAPER", - "paradata_folder": "", - "reporting_data_file": "", - "mode_specifications": "" - } - ], - - "multimode_dataset_name": "MULTIMODE", - - "reconciliation_specifications": "", - - "transformation_specifications": "", - - "information_levels_specifications": "" - -} From 268497a8c97c8f0ef17752d64537345f0fde1042 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 24 Jun 2024 11:35:55 +0200 Subject: [PATCH 24/46] Create directories method into interface --- .../java/fr/insee/kraftwerk/core/outputs/OutputFiles.java | 2 +- .../java/fr/insee/kraftwerk/core/utils/TextFileWriter.java | 2 +- .../fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java | 5 +++-- .../kraftwerk/core/utils/files/FileUtilsInterface.java | 6 ++++++ .../java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java | 5 +++++ .../main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java | 2 +- .../kraftwerk/core/outputs/ParquetOutputFilesTest.java | 2 +- .../java/cucumber/functional_tests/MainDefinitions.java | 2 +- 8 files changed, 19 insertions(+), 7 deletions(-) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java index 34097fd4..d3c7611b 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java @@ -48,7 +48,7 @@ protected OutputFiles(Path outDirectory, VtlBindings vtlBindings, List m /** Create output folder if doesn't exist. */ private void createOutputFolder() { - FileSystemImpl.createDirectoryIfNotExist(outputFolder); + fileUtilsInterface.createDirectoryIfNotExist(outputFolder); } /** See getOutputDatasetNames doc. */ diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java index 400317b0..67a195bc 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/TextFileWriter.java @@ -36,7 +36,7 @@ public static void writeFile(Path filePath, String fileContent, FileUtilsInterfa public static void writeErrorsFile(Path inDirectory, LocalDateTime localDateTime, List errors, FileUtilsInterface fileUtilsInterface) { Path tempOutputPath = FileUtilsInterface.transformToOut(inDirectory,localDateTime) .resolve(Constants.ERRORS_FILE_NAME); - FileSystemImpl.createDirectoryIfNotExist(tempOutputPath.getParent()); + fileUtilsInterface.createDirectoryIfNotExist(tempOutputPath.getParent()); //Write errors file if (!errors.isEmpty()) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index ce8463d6..b43f18a7 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -102,8 +102,9 @@ public Path getTempVtlFilePath(UserInputs userInputs, String step, String datase createDirectoryIfNotExist(FileUtilsInterface.transformToTemp(userInputs.getInputDirectory())); return FileUtilsInterface.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); } - - public static void createDirectoryIfNotExist(Path path) { + + @Override + public void createDirectoryIfNotExist(Path path) { try { Files.createDirectories(path); log.info(String.format("Created folder: %s", path.toFile().getAbsolutePath())); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index eb3acbcd..ef2f1576 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -101,6 +101,12 @@ private static Path transformToOther(Path inDirectory, String other) { */ List listFilePaths(String dir); + /** + * Create parent directories of the file + * @param path path of the file + */ + void createDirectoryIfNotExist(Path path); + //Conversions Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; URL convertToUrl(String userField, Path inputDirectory); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index bf444247..c1a8237e 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -111,6 +111,11 @@ public List listFilePaths(String dir) { return listFileNames(dir); } + @Override + public void createDirectoryIfNotExist(Path path) { + //MinIO creates automatically the folders + } + @Override public Path getTempVtlFilePath(UserInputs userInputs, String step, String dataset) { return FileUtilsInterface.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java index e32055f9..6e0128e0 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/vtl/VtlExecute.java @@ -121,7 +121,7 @@ public void putVtlDataset(String filePath, String bindingName, VtlBindings bindi * @param jsonOutFile Path to write the output json file. * */ public void writeJsonDataset(String bindingName, Path jsonOutFile, VtlBindings bindings) { - FileSystemImpl.createDirectoryIfNotExist(jsonOutFile.getParent()); + fileUtilsInterface.createDirectoryIfNotExist(jsonOutFile.getParent()); //Write file if (bindings.containsKey(bindingName)) { diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java index a4b9fd82..067077f1 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/outputs/ParquetOutputFilesTest.java @@ -99,7 +99,7 @@ void writeParquetFromDatasetTest() throws KraftwerkException { // Clean the existing file // Files.deleteIfExists(outputFiles.getOutputFolder()); - FileSystemImpl.createDirectoryIfNotExist(outputFiles.getOutputFolder()); + fileUtilsInterface.createDirectoryIfNotExist(outputFiles.getOutputFolder()); Map metaModels = new HashMap<>(); MetadataModel metMod = new MetadataModel(); diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java index c2f0ec78..af4515cd 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/MainDefinitions.java @@ -370,7 +370,7 @@ void deleteDirectory(File directoryToBeDeleted) { private void writeErrorsFile(Path inDirectory,LocalDateTime localDateTime, List errors) { Path tempOutputPath = FileUtilsInterface.transformToOut(inDirectory,localDateTime).resolve(Constants.ERRORS_FILE_NAME); - FileSystemImpl.createDirectoryIfNotExist(tempOutputPath.getParent()); + new FileSystemImpl().createDirectoryIfNotExist(tempOutputPath.getParent()); // Write errors file if (!errors.isEmpty()) { From 417b9ae35e34866dbe89aa4d04ef1033b617413c Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 24 Jun 2024 14:00:44 +0200 Subject: [PATCH 25/46] File system tests + moved common methods to interface --- .../kraftwerk/core/inputs/UserInputsFile.java | 18 +- .../core/inputs/UserInputsGenesis.java | 2 +- .../core/utils/files/FileSystemImpl.java | 65 ++----- .../core/utils/files/FileUtilsInterface.java | 34 +++- .../kraftwerk/core/utils/files/MinioImpl.java | 26 --- .../core/utils/files/FileSystemImplTest.java | 161 ++++++++++++++++++ .../utils/files/FileSystemInterfaceTest.java | 40 +++++ .../unit_tests/files/convert_path/test.txt | 1 + .../unit_tests/files/read_files/test.txt | 1 + 9 files changed, 260 insertions(+), 88 deletions(-) create mode 100644 kraftwerk-core/src/test/resources/unit_tests/files/convert_path/test.txt create mode 100644 kraftwerk-core/src/test/resources/unit_tests/files/read_files/test.txt diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java index 7b4239de..c44f1055 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java @@ -45,13 +45,13 @@ private void readUserInputs() throws UnknownDataFormatException, MissingMandator String dataFolder = readField(fileNode, "data_file"); String paradataFolder = readField(fileNode, "paradata_folder"); String reportingFolder = readField(fileNode, "reporting_data_file"); - Path dataPath = (fileUtilsInterface.isFileExists(dataFolder)) ? convertToUserPath(dataFolder) : fileUtilsInterface.convertToPath(dataFolder,inputDirectory); - URL ddiFile = fileUtilsInterface.convertToUrl(readField(fileNode, "DDI_file"),inputDirectory); - Path lunaticFile = fileUtilsInterface.convertToPath(readField(fileNode, "lunatic_file"),inputDirectory); + Path dataPath = (fileUtilsInterface.isFileExists(dataFolder)) ? convertToUserPath(dataFolder) : FileUtilsInterface.convertToPath(dataFolder,inputDirectory); + URL ddiFile = FileUtilsInterface.convertToUrl(readField(fileNode, "DDI_file"),inputDirectory); + Path lunaticFile = FileUtilsInterface.convertToPath(readField(fileNode, "lunatic_file"),inputDirectory); String dataFormat = readField(fileNode, "data_format"); - Path paradataPath = (paradataFolder != null && fileUtilsInterface.isFileExists(paradataFolder)) ? convertToUserPath(paradataFolder) : fileUtilsInterface.convertToPath(paradataFolder,inputDirectory); - Path reportingDataFile = (reportingFolder != null && fileUtilsInterface.isFileExists(reportingFolder)) ? convertToUserPath(reportingFolder) : fileUtilsInterface.convertToPath(reportingFolder,inputDirectory); - Path vtlFile = fileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); + Path paradataPath = (paradataFolder != null && fileUtilsInterface.isFileExists(paradataFolder)) ? convertToUserPath(paradataFolder) : FileUtilsInterface.convertToPath(paradataFolder,inputDirectory); + Path reportingDataFile = (reportingFolder != null && fileUtilsInterface.isFileExists(reportingFolder)) ? convertToUserPath(reportingFolder) : FileUtilsInterface.convertToPath(reportingFolder,inputDirectory); + Path vtlFile = FileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); ModeInputs modeInputs = new ModeInputs(); modeInputs.setDataFile(dataPath); modeInputs.setDdiUrl(ddiFile); @@ -64,9 +64,9 @@ private void readUserInputs() throws UnknownDataFormatException, MissingMandator } // multimodeDatasetName = readField(userInputs, "multimode_dataset_name"); - vtlReconciliationFile = fileUtilsInterface.convertToPath(readField(userInputs, "reconciliation_specifications"),inputDirectory); - vtlTransformationsFile = fileUtilsInterface.convertToPath(readField(userInputs, "transformation_specifications"),inputDirectory); - vtlInformationLevelsFile = fileUtilsInterface.convertToPath(readField(userInputs, "information_levels_specifications"),inputDirectory); + vtlReconciliationFile = FileUtilsInterface.convertToPath(readField(userInputs, "reconciliation_specifications"),inputDirectory); + vtlTransformationsFile = FileUtilsInterface.convertToPath(readField(userInputs, "transformation_specifications"),inputDirectory); + vtlInformationLevelsFile = FileUtilsInterface.convertToPath(readField(userInputs, "information_levels_specifications"),inputDirectory); } catch (IOException e) { log.error("Unable to read user input file: {} , {}", userInputFile, e); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java index 8994224d..4c7a988a 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java @@ -75,7 +75,7 @@ private Path getModeVtlFile(Mode mode) throws UnknownDataFormatException, Missin String dataMode = readField(fileNode, "data_mode"); if (dataMode == null) {break;} if (dataMode.equals(mode.name())) { - return fileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); + return FileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); } } } catch (IOException e) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index b43f18a7..1f449ea0 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -113,36 +113,6 @@ public void createDirectoryIfNotExist(Path path) { } } - @Override - public Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { - if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { - Path inputPath = inputDirectory.resolve(userField); - if (!new File(inputPath.toUri()).exists()) { - throw new KraftwerkException(400, String.format("The input folder \"%s\" does not exist in \"%s\".", userField, inputDirectory)); - } - return inputPath; - } else { - return null; - } - } - - @Override - public URL convertToUrl(String userField, Path inputDirectory) { - if (userField == null) { - log.debug("null value out of method that reads DDI field (should not happen)."); - return null; - } - try { - if (userField.startsWith("http")) { - return new URI(userField).toURL(); - } - return inputDirectory.resolve(userField).toFile().toURI().toURL(); - } catch (MalformedURLException | URISyntaxException e) { - log.error("Unable to convert URL from user input: " + userField); - return null; - } - } - @Override @Nullable public Boolean isDirectory(String path) { @@ -164,7 +134,7 @@ public long getSizeOf(String path) { @Override public void writeFile(String path, String toWrite, boolean replace) { - createDirectoryIfNotExist(Path.of(path)); + createDirectoryIfNotExist(Path.of(path).getParent()); StandardOpenOption standardOpenOption = replace || !isFileExists(path) ? StandardOpenOption.CREATE : StandardOpenOption.APPEND; try { Files.write(Path.of(path), toWrite.getBytes(), standardOpenOption); @@ -177,7 +147,7 @@ public void writeFile(String path, String toWrite, boolean replace) { public String findFile(String directory, String regex) throws KraftwerkException { try (Stream files = Files.find(Path.of(directory), 1, (path, basicFileAttributes) -> path.toFile().getName().toLowerCase().matches(regex))) { return files.findFirst() - .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + directory)).toString(); + .orElseThrow(() -> new KraftwerkException(404, "No file (%s) found in ".formatted(regex) + directory)).toString(); }catch (IOException e){ log.error(e.toString()); return null; @@ -199,6 +169,21 @@ public boolean isFileExists(String path) { return Files.exists(Path.of(path)); } + @Override + public void moveFile(String srcPath, String dstPath) throws KraftwerkException { + try { + createDirectoryIfNotExist(Path.of(dstPath).getParent()); + Files.move(Path.of(srcPath), Path.of(dstPath), StandardCopyOption.REPLACE_EXISTING); + } catch (IOException e) { + throw new KraftwerkException(500, "Can't move file " + srcPath + " to " + dstPath); + } + } + + @Override + public void moveFile(Path fileSystemPath, String dstPath) throws KraftwerkException { + //Same than other moveFile + moveFile(fileSystemPath.toString(), dstPath); + } // Utilities @@ -217,22 +202,6 @@ private void archiveReportingData(Path inputFolder, String campaignName, ModeInp } } - @Override - public void moveFile(String srcPath, String dstPath) throws KraftwerkException { - try { - createDirectoryIfNotExist(Path.of(dstPath).getParent()); - Files.move(Path.of(srcPath), Path.of(dstPath), StandardCopyOption.REPLACE_EXISTING); - } catch (IOException e) { - throw new KraftwerkException(500, "Can't move file " + srcPath + " to " + dstPath); - } - } - - @Override - public void moveFile(Path fileSystemPath, String dstPath) throws KraftwerkException { - //Same than other moveFile - moveFile(fileSystemPath.toString(), dstPath); - } - /** * If paradata, we move the paradata folder * @param inputFolder diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index ef2f1576..6b71dab3 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -6,7 +6,11 @@ import fr.insee.kraftwerk.core.inputs.UserInputsFile; import javax.annotation.Nullable; +import java.io.File; import java.io.InputStream; +import java.net.MalformedURLException; +import java.net.URI; +import java.net.URISyntaxException; import java.net.URL; import java.nio.file.Path; import java.time.LocalDateTime; @@ -41,6 +45,32 @@ private static Path transformToOther(Path inDirectory, String other) { : transformToOther(inDirectory.getParent(), other).resolve(inDirectory.getFileName()); } + static Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { + if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { + Path inputPath = inputDirectory.resolve(userField); + if (!new File(inputPath.toUri()).exists()) { + throw new KraftwerkException(400, String.format("The input folder \"%s\" does not exist in \"%s\".", userField, inputDirectory)); + } + return inputPath; + } else { + return null; + } + } + + static URL convertToUrl(String userField, Path inputDirectory) { + if (userField == null) { + return null; + } + try { + if (userField.startsWith("http")) { + return new URI(userField).toURL(); + } + return inputDirectory.resolve(userField).toFile().toURI().toURL(); + } catch (MalformedURLException | URISyntaxException e) { + return null; + } + } + //Methods to implement //File system interactions /** @@ -107,10 +137,6 @@ private static Path transformToOther(Path inDirectory, String other) { */ void createDirectoryIfNotExist(Path path); - //Conversions - Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; - URL convertToUrl(String userField, Path inputDirectory); - //Checks /** * Check if file exists diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index c1a8237e..9b795177 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -121,32 +121,6 @@ public Path getTempVtlFilePath(UserInputs userInputs, String step, String datase return FileUtilsInterface.transformToTemp(userInputs.getInputDirectory()).resolve(step+ dataset+".vtl"); } - @Override - public Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { - if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { - return inputDirectory.resolve(userField); - } else { - return null; - } - } - - @Override - public URL convertToUrl(String userField, Path inputDirectory) { - if (userField == null) { - log.debug("null value out of method that reads DDI field (should not happen)."); - return null; - } - try { - if (userField.startsWith("http")) { - return new URI(userField).toURL(); - } - return inputDirectory.resolve(userField).toFile().toURI().toURL(); - } catch (MalformedURLException | URISyntaxException e) { - log.error("Unable to convert URL from user input: " + userField); - return null; - } - } - @Override public Boolean isDirectory(String path){ try { diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java index a93ec89c..02fe2119 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java @@ -9,6 +9,7 @@ import java.io.File; import java.io.IOException; +import java.io.InputStream; import java.nio.file.Files; import java.nio.file.Path; import java.nio.file.Paths; @@ -145,4 +146,164 @@ void listFilePathsTest() { Assertions.assertThat(Path.of(filePath).getFileName().toString()).containsAnyOf("file1.txt", "file2.json", "file3.xml"); } } + + @Test + void createDirectoryTest() throws IOException { + //GIVEN + String campaignName = "create_directory"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + fileSystemImpl.createDirectoryIfNotExist(inputDirectory); + + //THEN + Assertions.assertThat(inputDirectory.toFile()).exists().isDirectory(); + + //CLEAN + Files.deleteIfExists(inputDirectory); + } + + @Test + void isDirectoryTest(){ + //GIVEN + String campaignName = "move_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + THEN + Assertions.assertThat(fileSystemImpl.isDirectory(String.valueOf(inputDirectory))).isTrue(); + Assertions.assertThat(fileSystemImpl.isDirectory(String.valueOf(inputDirectory.resolve("move_files.json")))).isFalse(); + Assertions.assertThat(fileSystemImpl.isDirectory(String.valueOf(inputDirectory.resolve("NULL.json")))).isNull(); + } + + @Test + void getSizeOfTest() throws IOException { + //GIVEN + String campaignName = "convert_path"; + Path file = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName).resolve("test.txt"); + + //WHEN + THEN + Assertions.assertThat(fileSystemImpl.getSizeOf(file.toString())).isEqualTo(Files.size(file)); + } + + @Test + void writeFileTest() throws IOException { + //GIVEN + String campaignName = "write_file"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + fileSystemImpl.writeFile(inputDirectory.resolve("test.txt").toString(),"test",true); + + //THEN + Assertions.assertThat(new File(inputDirectory.resolve("test.txt").toString())).exists(); + Assertions.assertThat(Files.readAllBytes(inputDirectory.resolve("test.txt"))).contains("test".getBytes()); + + //CLEAN + Files.deleteIfExists(inputDirectory.resolve("test.txt")); + Files.deleteIfExists(inputDirectory); + } + + @Test + void writeFileTest_append() throws IOException { + //GIVEN + String campaignName = "write_file"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + fileSystemImpl.writeFile(inputDirectory.resolve("test.txt").toString(),"test1",true); + fileSystemImpl.writeFile(inputDirectory.resolve("test.txt").toString(),"\ntest2",false); + + //THEN + Assertions.assertThat(new File(inputDirectory.resolve("test.txt").toString())).exists(); + Assertions.assertThat(Files.readAllBytes(inputDirectory.resolve("test.txt"))).contains("test".getBytes()).contains("test2".getBytes()); + + //CLEAN + Files.deleteIfExists(inputDirectory.resolve("test.txt")); + Files.deleteIfExists(inputDirectory); + } + @Test + void findFileTest() throws KraftwerkException { + //GIVEN + String campaignName = "list_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + THEN + Assertions.assertThat(fileSystemImpl.findFile(inputDirectory.toString(), "[\\w,\\s-]+\\.xml")).isNotEmpty(); + } + + @Test + void findFileTest_notfound() throws KraftwerkException { + //GIVEN + String campaignName = "list_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN+THEN + assertThrows(KraftwerkException.class, () -> fileSystemImpl.findFile(inputDirectory.toString(),Constants.DDI_FILE_REGEX)); + } + + @Test + void readFileTest() throws IOException { + //GIVEN + String campaignName = "read_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + THEN + try(InputStream inputStream = fileSystemImpl.readFile(inputDirectory.resolve("test.txt").toString())){ + Assertions.assertThat(inputStream).hasContent("hello !"); + } + } + + @Test + void isFileExistsTest(){ + //GIVEN + String campaignName = "read_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN + THEN + Assertions.assertThat(fileSystemImpl.isFileExists(inputDirectory.resolve("test.txt").toString())).isTrue(); + Assertions.assertThat(fileSystemImpl.isFileExists(inputDirectory.resolve("null.txt").toString())).isFalse(); + } + + @Test + void moveFileTest() throws KraftwerkException, IOException { + //GIVEN + String campaignName = "move_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + Files.copy(inputDirectory.resolve("move_files.json"),inputDirectory.resolve("test1.txt")); + + String campaignName2 = "move_files2"; + Path inputDirectory2 = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName2); + + //WHEN + fileSystemImpl.moveFile(inputDirectory.resolve("test1.txt").toString(), inputDirectory2.resolve("test2.txt").toString()); + + //THEN + Assertions.assertThat(inputDirectory2.resolve("test2.txt")).exists(); + + //CLEAN + Files.deleteIfExists(inputDirectory2.resolve("test2.txt")); + Files.deleteIfExists(inputDirectory.resolve("test1.txt")); + } + + @Test + void moveFileTest_FromPath() throws KraftwerkException, IOException { + //GIVEN + String campaignName = "move_files"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + Files.copy(inputDirectory.resolve("move_files.json"),inputDirectory.resolve("test1.txt")); + + String campaignName2 = "move_files2"; + Path inputDirectory2 = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName2); + + //WHEN + fileSystemImpl.moveFile(inputDirectory.resolve("test1.txt"), inputDirectory2.resolve("test2.txt").toString()); + + //THEN + Assertions.assertThat(inputDirectory2.resolve("test2.txt")).exists(); + + //CLEAN + Files.deleteIfExists(inputDirectory2.resolve("test2.txt")); + Files.deleteIfExists(inputDirectory.resolve("test1.txt")); + Files.deleteIfExists(inputDirectory2); + } } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java index ad917b7a..f1c2c4b4 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java @@ -1,5 +1,9 @@ package fr.insee.kraftwerk.core.utils.files; +import fr.insee.kraftwerk.core.TestConstants; +import fr.insee.kraftwerk.core.exceptions.KraftwerkException; +import org.assertj.core.api.Assertions; +import org.junit.Assert; import org.junit.jupiter.api.Test; import java.nio.file.Path; @@ -20,5 +24,41 @@ void testTransformToOut2() { Path path = Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/out/VQS"); assertEquals(path, FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"), LocalDateTime.now()).getParent()); } + + @Test + void convertToPathTest_nullUserField() throws KraftwerkException { + Assertions.assertThat(FileUtilsInterface.convertToPath(null,null)).isNull(); + } + + @Test + void convertToPathTest_directoryNotExists(){ + Assert.assertThrows(KraftwerkException.class, () -> FileUtilsInterface.convertToPath("test", Path.of("NOT SUPPOSED TO EXIST"))); + } + + @Test + void convertToPathTest() throws KraftwerkException { + //GIVEN + String campaignName = "convert_path"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN+THEN + Assertions.assertThat(FileUtilsInterface.convertToPath("test.txt", inputDirectory)).exists(); + } + + @Test + void convertToURLTest_nullUserField(){ + Assertions.assertThat(FileUtilsInterface.convertToUrl(null,null)).isNull(); + } + + @Test + void convertToURLTest(){ + //GIVEN + String campaignName = "convert_path"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN+THEN + Assertions.assertThat(FileUtilsInterface.convertToUrl("test.txt", inputDirectory).getFile()).endsWith("test.txt"); + } + } diff --git a/kraftwerk-core/src/test/resources/unit_tests/files/convert_path/test.txt b/kraftwerk-core/src/test/resources/unit_tests/files/convert_path/test.txt new file mode 100644 index 00000000..30d74d25 --- /dev/null +++ b/kraftwerk-core/src/test/resources/unit_tests/files/convert_path/test.txt @@ -0,0 +1 @@ +test \ No newline at end of file diff --git a/kraftwerk-core/src/test/resources/unit_tests/files/read_files/test.txt b/kraftwerk-core/src/test/resources/unit_tests/files/read_files/test.txt new file mode 100644 index 00000000..84ac6f96 --- /dev/null +++ b/kraftwerk-core/src/test/resources/unit_tests/files/read_files/test.txt @@ -0,0 +1 @@ +hello ! \ No newline at end of file From 8a2c9a4b3125c364d8191781a54f29dd7b8aea8f Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 26 Jun 2024 08:39:24 +0200 Subject: [PATCH 26/46] Fixes MinIO after manual tests --- .../api/configuration/MinioConfig.java | 11 ++- .../kraftwerk/api/process/MainProcessing.java | 2 +- .../api/process/MainProcessingGenesis.java | 4 +- .../kraftwerk/core/inputs/ModeInputs.java | 3 +- .../kraftwerk/core/inputs/UserInputsFile.java | 22 +++--- .../core/inputs/UserInputsGenesis.java | 14 ++-- .../kraftwerk/core/metadata/DDIReader.java | 27 +++---- .../core/metadata/LunaticReader.java | 27 ++++--- .../core/metadata/MetadataUtils.java | 14 ++-- .../core/metadata/MetadataUtilsGenesis.java | 12 +-- .../kraftwerk/core/outputs/OutputFiles.java | 3 +- .../core/parsers/LunaticXmlDataParser.java | 2 +- .../BuildBindingsSequenceGenesis.java | 5 +- .../core/sequence/ControlInputSequence.java | 3 +- .../core/sequence/UnimodalSequence.java | 2 +- .../{JsonFileReader.java => JsonReader.java} | 12 ++- .../core/utils/files/FileSystemImpl.java | 28 +++++++ .../core/utils/files/FileUtilsInterface.java | 38 ++------- .../kraftwerk/core/utils/files/MinioImpl.java | 79 +++++++++++++------ .../core/utils/xsl/SaxonTransformer.java | 30 +++---- .../core/inputs/UserInputsFileTest.java | 2 +- .../core/metadata/DDIReaderTest.java | 8 +- .../core/metadata/LunaticReaderTest.java | 9 ++- .../kraftwerk/core/metadata/VariableTest.java | 8 +- .../sequence/BuildBindingsSequenceTest.java | 4 +- .../core/utils/files/FileSystemImplTest.java | 38 +++++++++ .../utils/files/FileSystemInterfaceTest.java | 35 -------- .../core/utils/files/MinioImplTest.java | 4 - .../core/utils/xsl/SaxonTransformerTest.java | 2 +- .../CalculatedProcessingDefinition.java | 4 +- .../DDIGetterDefinitions.java | 4 +- .../VariablesGetterDefinitions.java | 2 +- 32 files changed, 245 insertions(+), 213 deletions(-) rename kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/{JsonFileReader.java => JsonReader.java} (54%) delete mode 100644 kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java index 1bd8e6b2..4f20355a 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/configuration/MinioConfig.java @@ -1,15 +1,24 @@ package fr.insee.kraftwerk.api.configuration; import lombok.Getter; +import org.springframework.beans.factory.annotation.Value; import org.springframework.boot.context.properties.ConfigurationProperties; -@ConfigurationProperties(prefix = "fr.insee.postcollecte.minio") +@ConfigurationProperties @Getter public class MinioConfig { + @Value("${fr.insee.postcollecte.minio.endpoint}") private String endpoint; + + @Value("${fr.insee.postcollecte.minio.access_key}") private String accessKey; + + @Value("${fr.insee.postcollecte.minio.secret_key}") private String secretKey; + + @Value("${fr.insee.postcollecte.minio.enable}") private boolean enable; + @Value("${fr.insee.postcollecte.minio.bucket_name}") private String bucketName; } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java index a2fda208..547cecd1 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessing.java @@ -117,7 +117,7 @@ public void init() throws KraftwerkException { userInputsFile = controlInputSequence.getUserInputs(inDirectory, fileUtilsInterface); - metadataModels = withDDI ? MetadataUtils.getMetadata(userInputsFile.getModeInputsMap(), fileUtilsInterface) : MetadataUtils.getMetadataFromLunatic(userInputsFile.getModeInputsMap()); + metadataModels = withDDI ? MetadataUtils.getMetadata(userInputsFile.getModeInputsMap(), fileUtilsInterface) : MetadataUtils.getMetadataFromLunatic(userInputsFile.getModeInputsMap(), fileUtilsInterface); userInputsFileList = getUserInputsFile(userInputsFile, fileByFile); diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java index 99b60723..6ccc94d7 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java @@ -23,7 +23,6 @@ import lombok.extern.log4j.Log4j2; import org.apache.commons.collections4.ListUtils; import org.springframework.boot.web.client.RestTemplateBuilder; -import org.springframework.stereotype.Component; import java.io.IOException; import java.nio.file.Path; @@ -35,7 +34,6 @@ import java.util.Map; @Log4j2 -@Component public class MainProcessingGenesis { @Setter @@ -112,7 +110,7 @@ public void runMain(String idCampaign) throws KraftwerkException, IOException { private void unimodalProcess(List suLatest) throws KraftwerkException { BuildBindingsSequenceGenesis buildBindingsSequenceGenesis = new BuildBindingsSequenceGenesis(fileUtilsInterface); for (String dataMode : userInputs.getModeInputsMap().keySet()) { - buildBindingsSequenceGenesis.buildVtlBindings(dataMode, vtlBindings, metadataModels, suLatest, inDirectory, database); + buildBindingsSequenceGenesis.buildVtlBindings(dataMode, vtlBindings, metadataModels, suLatest, inDirectory); UnimodalSequence unimodal = new UnimodalSequence(); unimodal.applyUnimodalSequence(userInputs, dataMode, vtlBindings, errors, metadataModels, fileUtilsInterface); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/ModeInputs.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/ModeInputs.java index 0f79cfbd..eb88e596 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/ModeInputs.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/ModeInputs.java @@ -5,7 +5,6 @@ import lombok.Getter; import lombok.Setter; -import java.net.URL; import java.nio.file.Path; /** @@ -16,7 +15,7 @@ public class ModeInputs { protected Path dataFile; - protected URL ddiUrl; + protected String ddiUrl; protected Path lunaticFile; protected DataFormat dataFormat; protected String dataMode; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java index c44f1055..1384dd87 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsFile.java @@ -5,7 +5,7 @@ import fr.insee.kraftwerk.core.exceptions.MissingMandatoryFieldException; import fr.insee.kraftwerk.core.exceptions.UnknownDataFormatException; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; -import fr.insee.kraftwerk.core.utils.JsonFileReader; +import fr.insee.kraftwerk.core.utils.JsonReader; import lombok.Getter; import lombok.Setter; import lombok.extern.log4j.Log4j2; @@ -36,7 +36,7 @@ public UserInputsFile(Path userConfigFile, Path inputDirectory, FileUtilsInterfa private void readUserInputs() throws UnknownDataFormatException, MissingMandatoryFieldException, KraftwerkException { try { - JsonNode userInputs = JsonFileReader.read(userInputFile); + JsonNode userInputs = JsonReader.read(userInputFile,fileUtilsInterface); // JsonNode filesNode = userInputs.get("survey_data"); for (JsonNode fileNode : filesNode) { @@ -45,13 +45,13 @@ private void readUserInputs() throws UnknownDataFormatException, MissingMandator String dataFolder = readField(fileNode, "data_file"); String paradataFolder = readField(fileNode, "paradata_folder"); String reportingFolder = readField(fileNode, "reporting_data_file"); - Path dataPath = (fileUtilsInterface.isFileExists(dataFolder)) ? convertToUserPath(dataFolder) : FileUtilsInterface.convertToPath(dataFolder,inputDirectory); - URL ddiFile = FileUtilsInterface.convertToUrl(readField(fileNode, "DDI_file"),inputDirectory); - Path lunaticFile = FileUtilsInterface.convertToPath(readField(fileNode, "lunatic_file"),inputDirectory); + Path dataPath = (fileUtilsInterface.isFileExists(dataFolder)) ? convertToUserPath(dataFolder) : fileUtilsInterface.convertToPath(dataFolder,inputDirectory); + String ddiFile = fileUtilsInterface.convertToUrl(readField(fileNode, "DDI_file"),inputDirectory); + Path lunaticFile = fileUtilsInterface.convertToPath(readField(fileNode, "lunatic_file"),inputDirectory); String dataFormat = readField(fileNode, "data_format"); - Path paradataPath = (paradataFolder != null && fileUtilsInterface.isFileExists(paradataFolder)) ? convertToUserPath(paradataFolder) : FileUtilsInterface.convertToPath(paradataFolder,inputDirectory); - Path reportingDataFile = (reportingFolder != null && fileUtilsInterface.isFileExists(reportingFolder)) ? convertToUserPath(reportingFolder) : FileUtilsInterface.convertToPath(reportingFolder,inputDirectory); - Path vtlFile = FileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); + Path paradataPath = (paradataFolder != null && fileUtilsInterface.isFileExists(paradataFolder)) ? convertToUserPath(paradataFolder) : fileUtilsInterface.convertToPath(paradataFolder,inputDirectory); + Path reportingDataFile = (reportingFolder != null && fileUtilsInterface.isFileExists(reportingFolder)) ? convertToUserPath(reportingFolder) : fileUtilsInterface.convertToPath(reportingFolder,inputDirectory); + Path vtlFile = fileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); ModeInputs modeInputs = new ModeInputs(); modeInputs.setDataFile(dataPath); modeInputs.setDdiUrl(ddiFile); @@ -64,9 +64,9 @@ private void readUserInputs() throws UnknownDataFormatException, MissingMandator } // multimodeDatasetName = readField(userInputs, "multimode_dataset_name"); - vtlReconciliationFile = FileUtilsInterface.convertToPath(readField(userInputs, "reconciliation_specifications"),inputDirectory); - vtlTransformationsFile = FileUtilsInterface.convertToPath(readField(userInputs, "transformation_specifications"),inputDirectory); - vtlInformationLevelsFile = FileUtilsInterface.convertToPath(readField(userInputs, "information_levels_specifications"),inputDirectory); + vtlReconciliationFile = fileUtilsInterface.convertToPath(readField(userInputs, "reconciliation_specifications"),inputDirectory); + vtlTransformationsFile = fileUtilsInterface.convertToPath(readField(userInputs, "transformation_specifications"),inputDirectory); + vtlInformationLevelsFile = fileUtilsInterface.convertToPath(readField(userInputs, "information_levels_specifications"),inputDirectory); } catch (IOException e) { log.error("Unable to read user input file: {} , {}", userInputFile, e); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java index 4c7a988a..6815c205 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java @@ -7,15 +7,13 @@ import fr.insee.kraftwerk.core.exceptions.MissingMandatoryFieldException; import fr.insee.kraftwerk.core.exceptions.UnknownDataFormatException; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; -import fr.insee.kraftwerk.core.utils.JsonFileReader; +import fr.insee.kraftwerk.core.utils.JsonReader; import lombok.extern.log4j.Log4j2; import java.io.IOException; -import java.nio.file.Files; import java.nio.file.Path; import java.util.ArrayList; import java.util.List; -import java.util.stream.Stream; @Log4j2 public class UserInputsGenesis extends UserInputs{ @@ -31,7 +29,7 @@ public UserInputsGenesis(boolean hasConfigFile, Path inputDirectory, List computeInputs(); } - private void computeInputs() throws KraftwerkException, IOException { + private void computeInputs() throws KraftwerkException { UserInputsFile userInputsFile; if(hasConfigFile){ userInputsFile = new UserInputsFile(inputDirectory.resolve(Constants.USER_INPUT_FILE), inputDirectory, fileUtilsInterface); @@ -49,9 +47,9 @@ private void computeInputs() throws KraftwerkException, IOException { * @param mode mode to get inputs from * @return a ModeInputs object */ - private ModeInputs getModeInputs(Mode mode) throws KraftwerkException, IOException { + private ModeInputs getModeInputs(Mode mode) throws KraftwerkException { ModeInputs modeInputs = new ModeInputs(); - modeInputs.setDdiUrl(findDDIFile(inputDirectory.resolve(mode.name())).toFile().toURI().toURL()); + modeInputs.setDdiUrl(findDDIFile(inputDirectory.resolve(mode.name())).toString()); modeInputs.setLunaticFile(findLunaticFile(inputDirectory.resolve(mode.name()))); modeInputs.setDataMode(mode.name()); if (mode == Mode.WEB || mode == Mode.TEL || mode == Mode.F2F) { @@ -69,13 +67,13 @@ private ModeInputs getModeInputs(Mode mode) throws KraftwerkException, IOExcepti private Path getModeVtlFile(Mode mode) throws UnknownDataFormatException, MissingMandatoryFieldException, KraftwerkException { Path userInputFile = inputDirectory.resolve(Constants.USER_INPUT_FILE); try { - JsonNode userInputs = JsonFileReader.read(userInputFile); + JsonNode userInputs = JsonReader.read(userInputFile, fileUtilsInterface); JsonNode filesNode = userInputs.get("survey_data"); for (JsonNode fileNode : filesNode) { String dataMode = readField(fileNode, "data_mode"); if (dataMode == null) {break;} if (dataMode.equals(mode.name())) { - return FileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); + return fileUtilsInterface.convertToPath(readField(fileNode, "mode_specifications"),inputDirectory); } } } catch (IOException e) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java index 897df7c3..c4933525 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java @@ -20,7 +20,6 @@ import java.io.IOException; import java.io.InputStream; import java.net.MalformedURLException; -import java.net.URL; import java.nio.file.Files; import java.nio.file.Path; import java.util.List; @@ -40,12 +39,12 @@ private DDIReader() { * written in the system temporary folder with the name 'variables.xml'. This file is * deleted after being used or when the virtual machine terminates. * - * @param ddiUrl : Path to the DDI file. + * @param ddiUrlString : Path to the DDI file. * * @return The variables found in the DDI. * @throws KraftwerkException */ - public static MetadataModel getMetadataFromDDI(URL ddiUrl, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { + public static MetadataModel getMetadataFromDDI(String ddiUrlString, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { try { // Path of the output 'variables.xml' temp file @@ -53,15 +52,15 @@ public static MetadataModel getMetadataFromDDI(URL ddiUrl, FileUtilsInterface fi variablesFile.deleteOnExit(); Path variablesTempFilePath = variablesFile.toPath(); - transformDDI(ddiUrl, variablesTempFilePath); + transformDDI(ddiUrlString, variablesTempFilePath, fileUtilsInterface); - MetadataModel metadataModel = readVariables(variablesTempFilePath, fileUtilsInterface); + MetadataModel metadataModel = readVariables(variablesTempFilePath); Files.delete(variablesFile.toPath()); return metadataModel; } catch (MalformedURLException e) { - log.error(String.format("Error when converting file path '%s' to an URL.", ddiUrl), e); + log.error(String.format("Error when converting file path '%s' to an URL.", ddiUrlString), e); return null; } catch (IOException e) { log.error("Unable to write temp file.", e); @@ -75,12 +74,12 @@ public static MetadataModel getMetadataFromDDI(URL ddiUrl, FileUtilsInterface fi /** * Apply the XSLT_STRUCTURED_VARIABLES transformation. * - * @param ddiUrl : URL of the DDI file. + * @param ddiUrlString : URL of the DDI file. * @param variablesFilePath : Path of the 'variables.xml' file to be generated. */ - private static void transformDDI(URL ddiUrl, Path variablesFilePath) { - SaxonTransformer saxonTransformer = new SaxonTransformer(); - saxonTransformer.xslTransform(ddiUrl, Constants.XSLT_STRUCTURED_VARIABLES, variablesFilePath); + private static void transformDDI(String ddiUrlString, Path variablesFilePath, FileUtilsInterface fileUtilsInterface) { + SaxonTransformer saxonTransformer = new SaxonTransformer(fileUtilsInterface); + saxonTransformer.xslTransform(ddiUrlString, Constants.XSLT_STRUCTURED_VARIABLES, variablesFilePath); } /** @@ -94,12 +93,12 @@ private static void transformDDI(URL ddiUrl, Path variablesFilePath) { * @throws SAXException * @throws ParserConfigurationException */ - private static MetadataModel readVariables(Path variablesFilePath, FileUtilsInterface fileUtilsInterface) + private static MetadataModel readVariables(Path variablesFilePath) throws KraftwerkException, SAXException, IOException, ParserConfigurationException { MetadataModel metadataModel = new MetadataModel(); // Parse - Element root = readXmlFile(variablesFilePath, fileUtilsInterface); + Element root = readXmlFile(variablesFilePath); // Get XML groups NodeList groupElements = root.getChildNodes(); @@ -232,7 +231,7 @@ private static void addValues(UcqVariable variable, NodeList valueElements) { private static boolean nodeIsElementWithName(Node groupNode, String name) { return name.equals(groupNode.getNodeName()) && groupNode.getNodeType() == Node.ELEMENT_NODE; } - private static Element readXmlFile(Path variablesFilePath, FileUtilsInterface fileUtilsInterface) + private static Element readXmlFile(Path variablesFilePath) throws ParserConfigurationException, SAXException, IOException, KraftwerkException { System.setProperty("javax.xml.parsers.DocumentBuilderFactory", "com.sun.org.apache.xerces.internal.jaxp.DocumentBuilderFactoryImpl"); @@ -241,7 +240,7 @@ private static Element readXmlFile(Path variablesFilePath, FileUtilsInterface fi factory.setAttribute(XMLConstants.ACCESS_EXTERNAL_DTD, ""); factory.setAttribute(XMLConstants.ACCESS_EXTERNAL_SCHEMA, ""); DocumentBuilder builder = factory.newDocumentBuilder(); - try(InputStream inputStream = fileUtilsInterface.readFile(variablesFilePath.toString())){ + try(InputStream inputStream = Files.newInputStream(variablesFilePath)){ Document document = builder.parse(inputStream); if (document == null) throw new KraftwerkException(500, "Can't read DDI - DDI is null"); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/LunaticReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/LunaticReader.java index 142de0f2..52051f96 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/LunaticReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/LunaticReader.java @@ -3,7 +3,8 @@ import com.fasterxml.jackson.databind.JsonNode; import fr.insee.kraftwerk.core.Constants; import fr.insee.kraftwerk.core.metadata.CalculatedVariables.CalculatedVariable; -import fr.insee.kraftwerk.core.utils.JsonFileReader; +import fr.insee.kraftwerk.core.utils.JsonReader; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import lombok.extern.log4j.Log4j2; import java.io.IOException; @@ -38,9 +39,9 @@ private LunaticReader() { * @param lunaticFile Path to a lunatic questionnaire file. * @return A CalculatedVariables map. */ - public static CalculatedVariables getCalculatedFromLunatic(Path lunaticFile) { + public static CalculatedVariables getCalculatedFromLunatic(Path lunaticFile, FileUtilsInterface fileUtilsInterface) { try { - JsonNode rootNode = JsonFileReader.read(lunaticFile); + JsonNode rootNode = JsonReader.read(lunaticFile, fileUtilsInterface); String lunaticModelVersion = rootNode.get(LUNATIC_MODEL_VERSION).asText(); boolean isLunaticV2 = compareVersions(lunaticModelVersion, "2.3.0") > 0; @@ -76,9 +77,9 @@ public static CalculatedVariables getCalculatedFromLunatic(Path lunaticFile) { * @param lunaticFile Path to a lunatic questionnaire file. * @return A List of String. */ - public static List getMissingVariablesFromLunatic(Path lunaticFile) { + public static List getMissingVariablesFromLunatic(Path lunaticFile, FileUtilsInterface fileUtilsInterface) { try { - JsonNode rootNode = JsonFileReader.read(lunaticFile); + JsonNode rootNode = JsonReader.read(lunaticFile, fileUtilsInterface); List variables = new ArrayList<>(); List varsEno = Arrays.asList(Constants.getEnoVariables()); @@ -100,9 +101,9 @@ public static List getMissingVariablesFromLunatic(Path lunaticFile) { * @param lunaticFile Path to a lunatic questionnaire file. * @return A List of String. */ - public static List getFilterResultFromLunatic(Path lunaticFile) { + public static List getFilterResultFromLunatic(Path lunaticFile, FileUtilsInterface fileUtilsInterface) { try { - JsonNode rootNode = JsonFileReader.read(lunaticFile); + JsonNode rootNode = JsonReader.read(lunaticFile, fileUtilsInterface); List variables = new ArrayList<>(); JsonNode variablesNode = rootNode.get(VARIABLES); @@ -115,9 +116,9 @@ public static List getFilterResultFromLunatic(Path lunaticFile) { } } - public static String getLunaticModelVersion(Path lunaticFile){ + public static String getLunaticModelVersion(Path lunaticFile, FileUtilsInterface fileUtilsInterface){ try { - JsonNode rootNode = JsonFileReader.read(lunaticFile); + JsonNode rootNode = JsonReader.read(lunaticFile, fileUtilsInterface); return rootNode.get(LUNATIC_MODEL_VERSION).toString(); } catch (IOException e) { @@ -133,10 +134,10 @@ public static String getLunaticModelVersion(Path lunaticFile){ * @param lunaticFile : Path to a Lunatic specification file. * @return The variables found in the Lunatic specification. */ - public static MetadataModel getMetadataFromLunatic(Path lunaticFile) { + public static MetadataModel getMetadataFromLunatic(Path lunaticFile, FileUtilsInterface fileUtilsInterface) { JsonNode rootNode; try { - rootNode = JsonFileReader.read(lunaticFile); + rootNode = JsonReader.read(lunaticFile, fileUtilsInterface); List variables = new ArrayList<>(); JsonNode variablesNode = rootNode.get(VARIABLES); variablesNode.forEach(newVar -> variables.add(newVar.get("name").asText())); @@ -405,10 +406,10 @@ private static Group getNewGroup(MetadataModel metadataModel, String newName, Gr * @param lunaticFile : Path to a Lunatic specification file. * @return the questionnaire model id */ - public static String getQuestionnaireModelId(Path lunaticFile) { + public static String getQuestionnaireModelId(Path lunaticFile, FileUtilsInterface fileUtilsInterface) { JsonNode rootNode; try { - rootNode = JsonFileReader.read(lunaticFile); + rootNode = JsonReader.read(lunaticFile, fileUtilsInterface); return rootNode.get("id").asText(); } catch (IOException e) { log.error(EXCEPTION_MESSAGE + lunaticFile); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java index 09c0f8b5..34cd633a 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtils.java @@ -34,14 +34,14 @@ private static void putToMetadataModels(String dataMode, ModeInputs modeInputs, // Step 2 : we add the variables that are only present in the Lunatic file if (modeInputs.getLunaticFile() != null) { // We read and store lunaticModelVersion - metadataModel.putSpecVersions(SpecType.LUNATIC,LunaticReader.getLunaticModelVersion(modeInputs.getLunaticFile())); + metadataModel.putSpecVersions(SpecType.LUNATIC,LunaticReader.getLunaticModelVersion(modeInputs.getLunaticFile(), fileUtilsInterface)); // First we add the collected _MISSING variables - List missingVars = LunaticReader.getMissingVariablesFromLunatic(modeInputs.getLunaticFile()); + List missingVars = LunaticReader.getMissingVariablesFromLunatic(modeInputs.getLunaticFile(), fileUtilsInterface); for (String missingVar : missingVars) { addLunaticVariable(metadataModel, missingVar, Constants.MISSING_SUFFIX, VariableType.STRING); } // Then we add calculated FILTER_RESULT_ variables - List filterResults = LunaticReader.getFilterResultFromLunatic(modeInputs.getLunaticFile()); + List filterResults = LunaticReader.getFilterResultFromLunatic(modeInputs.getLunaticFile(), fileUtilsInterface); for (String filterResult : filterResults) { addLunaticVariable(metadataModel, filterResult, Constants.FILTER_RESULT_PREFIX, VariableType.BOOLEAN); } @@ -78,14 +78,14 @@ public static void addLunaticVariable(MetadataModel metadata, String missingVar, metadata.getVariables().putVariable(new Variable(missingVar, group, varType)); } - public static Map getMetadataFromLunatic(Map modeInputsMap) { + public static Map getMetadataFromLunatic(Map modeInputsMap, FileUtilsInterface fileUtilsInterface) { Map metadataModels = new LinkedHashMap<>(); - modeInputsMap.forEach((k, v) -> putToMetadataVariableFromLunatic(k,v,metadataModels)); + modeInputsMap.forEach((k, v) -> putToMetadataVariableFromLunatic(k,v,metadataModels, fileUtilsInterface)); return metadataModels; } - private static void putToMetadataVariableFromLunatic(String dataMode, ModeInputs modeInputs, Map metadataModels ) { - MetadataModel metadataModel = LunaticReader.getMetadataFromLunatic(modeInputs.getLunaticFile()); + private static void putToMetadataVariableFromLunatic(String dataMode, ModeInputs modeInputs, Map metadataModels, FileUtilsInterface fileUtilsInterface) { + MetadataModel metadataModel = LunaticReader.getMetadataFromLunatic(modeInputs.getLunaticFile(), fileUtilsInterface); // We add the variables for pairwise links if (metadataModel.getVariables().getVariable(Constants.LIENS) != null) { // We identify the group containing the individuals diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java index e6be34bc..5279a71d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/MetadataUtilsGenesis.java @@ -34,12 +34,12 @@ private static void putToMetadataVariable(String dataMode, ModeInputs modeInputs // Step 2 : we add the variables that are only present in the Lunatic file if (modeInputsGenesis.getLunaticFile() != null) { // First we add the collected _MISSING variables - List missingVars = LunaticReader.getMissingVariablesFromLunatic(modeInputsGenesis.getLunaticFile()); + List missingVars = LunaticReader.getMissingVariablesFromLunatic(modeInputsGenesis.getLunaticFile(), fileUtilsInterface); for (String missingVar : missingVars) { addLunaticVariable(metadataModel, missingVar, Constants.MISSING_SUFFIX, VariableType.STRING); } // Then we add calculated FILTER_RESULT_ variables - List filterResults = LunaticReader.getFilterResultFromLunatic(modeInputsGenesis.getLunaticFile()); + List filterResults = LunaticReader.getFilterResultFromLunatic(modeInputsGenesis.getLunaticFile(), fileUtilsInterface); for (String filterResult : filterResults) { addLunaticVariable(metadataModel, filterResult, Constants.FILTER_RESULT_PREFIX, VariableType.BOOLEAN); } @@ -66,14 +66,14 @@ public static void addLunaticVariable(MetadataModel metadataModel, String missin metadataModel.getVariables().putVariable(new Variable(missingVar, group, varType)); } - public static Map getMetadataFromLunatic(Map modeInputsMap) { + public static Map getMetadataFromLunatic(Map modeInputsMap, FileUtilsInterface fileUtilsInterface) { Map metadataModels = new LinkedHashMap<>(); - modeInputsMap.forEach((k, v) -> putToMetadataVariableFromLunatic(k,v,metadataModels)); + modeInputsMap.forEach((k, v) -> putToMetadataVariableFromLunatic(k,v,metadataModels, fileUtilsInterface)); return metadataModels; } - private static void putToMetadataVariableFromLunatic(String dataMode, ModeInputs modeInputs, Map metadataModels ) { - MetadataModel metadataModel = LunaticReader.getMetadataFromLunatic(modeInputs.getLunaticFile()); + private static void putToMetadataVariableFromLunatic(String dataMode, ModeInputs modeInputs, Map metadataModels, FileUtilsInterface fileUtilsInterface) { + MetadataModel metadataModel = LunaticReader.getMetadataFromLunatic(modeInputs.getLunaticFile(), fileUtilsInterface); metadataModels.put(dataMode, metadataModel); } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java index d3c7611b..6dab0a5d 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java @@ -4,7 +4,6 @@ import fr.insee.kraftwerk.core.KraftwerkError; import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.metadata.MetadataModel; -import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import fr.insee.kraftwerk.core.vtl.VtlBindings; import lombok.Getter; @@ -41,9 +40,9 @@ protected OutputFiles(Path outDirectory, VtlBindings vtlBindings, List m this.vtlBindings = vtlBindings; setOutputDatasetNames(modes); outputFolder = outDirectory; - createOutputFolder(); this.database = database; this.fileUtilsInterface = fileUtilsInterface; + createOutputFolder(); } /** Create output folder if doesn't exist. */ diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java index b325748e..a7cea016 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/parsers/LunaticXmlDataParser.java @@ -62,7 +62,7 @@ private void parseDataFile(Path filePath, Path lunaticFile) { .getChildElements("SurveyUnit"); String questionnaireModelId = null; if (lunaticFile != null) { - questionnaireModelId = LunaticReader.getQuestionnaireModelId(lunaticFile); + questionnaireModelId = LunaticReader.getQuestionnaireModelId(lunaticFile, fileUtilsInterface); } for (int i = 0; i < questionnaireNodeList.size(); i++) { diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java index 7365372d..f473f490 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceGenesis.java @@ -21,7 +21,6 @@ import fr.insee.kraftwerk.core.vtl.VtlExecute; import java.nio.file.Path; -import java.sql.Statement; import java.util.List; import java.util.Map; @@ -35,7 +34,7 @@ public BuildBindingsSequenceGenesis(FileUtilsInterface fileUtilsInterface) { this.fileUtilsInterface = fileUtilsInterface; } - public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map metadataModels, List surveyUnits, Path inDirectory, Statement database) throws KraftwerkException, NullException { + public void buildVtlBindings(String dataMode, VtlBindings vtlBindings, Map metadataModels, List surveyUnits, Path inDirectory) throws KraftwerkException { SurveyRawData data = new SurveyRawData(); /* Step 2.0 : Read the DDI file (and Lunatic Json for missing variables) to get survey variables */ @@ -91,7 +90,7 @@ private void parseParadata(String dataMode, SurveyRawData data, Path inDirectory } } - private void parseReportingData(String dataMode, SurveyRawData data, Path inDirectory, FileUtilsInterface fileUtilsInterface) throws KraftwerkException, NullException { + private void parseReportingData(String dataMode, SurveyRawData data, Path inDirectory, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { Path reportingDataFile = inDirectory.resolve(dataMode+Constants.REPORTING_DATA_FOLDER); if (fileUtilsInterface.isFileExists(reportingDataFile.toString())) { List listFiles = fileUtilsInterface.listFileNames(reportingDataFile.toString()); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java index 37877da8..f0e51ab8 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequence.java @@ -1,6 +1,5 @@ package fr.insee.kraftwerk.core.sequence; -import java.nio.file.Files; import java.nio.file.Path; import java.nio.file.Paths; @@ -27,7 +26,7 @@ public UserInputsFile getUserInputs(Path inDirectory, FileUtilsInterface fileUti } public Path getInDirectory(String inDirectoryParam) throws KraftwerkException { - Path inDirectory = Paths.get(inDirectoryParam); + Path inDirectory = Path.of(inDirectoryParam); if (!verifyInDirectory(inDirectory)) inDirectory = Paths.get(defaultDirectory, "in", inDirectoryParam); if (!verifyInDirectory(inDirectory)) throw new KraftwerkException(400, "Configuration file not found"); return inDirectory; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java index 030ed60b..330e22b7 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/UnimodalSequence.java @@ -41,7 +41,7 @@ public void applyUnimodalSequence(UserInputs userInputs, String dataMode, VtlBin /* Step 2.4b : Apply VTL expression for calculated variables (if any) */ if (modeInputs.getLunaticFile() != null) { CalculatedVariables calculatedVariables = LunaticReader - .getCalculatedFromLunatic(modeInputs.getLunaticFile()); + .getCalculatedFromLunatic(modeInputs.getLunaticFile(), fileUtilsInterface); CalculatedProcessing calculatedProcessing = new CalculatedProcessing(vtlBindings, calculatedVariables, fileUtilsInterface); vtlGenerate = calculatedProcessing.applyCalculatedVtlTransformations(dataMode, modeInputs.getModeVtlFile(), errors); TextFileWriter.writeFile(fileUtilsInterface.getTempVtlFilePath(userInputs, "CalculatedProcessing", dataMode), diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/JsonFileReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/JsonReader.java similarity index 54% rename from kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/JsonFileReader.java rename to kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/JsonReader.java index 684994a6..b3e77027 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/JsonFileReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/JsonReader.java @@ -1,14 +1,16 @@ package fr.insee.kraftwerk.core.utils; import java.io.IOException; +import java.io.InputStream; import java.nio.file.Path; import com.fasterxml.jackson.databind.JsonNode; import com.fasterxml.jackson.databind.ObjectMapper; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; -public class JsonFileReader { +public class JsonReader { - private JsonFileReader(){ + private JsonReader(){ throw new IllegalStateException("Utility class"); } @@ -19,9 +21,11 @@ private JsonFileReader(){ * * @return A jackson.databind.JsonNode. */ - public static JsonNode read(Path filePath) throws IOException { + public static JsonNode read(Path filePath, FileUtilsInterface fileUtilsInterface) throws IOException { ObjectMapper mapper = new ObjectMapper(); - return mapper.readTree(filePath.toFile()); + try (InputStream inputStream = fileUtilsInterface.readFile(filePath.toString())){ + return mapper.readTree(inputStream); + } } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 1f449ea0..6cb281cb 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -185,6 +185,34 @@ public void moveFile(Path fileSystemPath, String dstPath) throws KraftwerkExcept moveFile(fileSystemPath.toString(), dstPath); } + @Override + public Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { + if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { + Path inputPath = inputDirectory.resolve(userField); + if (!new File(inputPath.toUri()).exists()) { + throw new KraftwerkException(400, String.format("The input folder \"%s\" does not exist in \"%s\".", userField, inputDirectory)); + } + return inputPath; + } else { + return null; + } + } + + @Override + public String convertToUrl(String userField, Path inputDirectory) { + if (userField == null) { + return null; + } + try { + if (userField.startsWith("http")) { + return new URI(userField).toURL().toString(); + } + return inputDirectory.resolve(userField).toFile().toString(); + } catch (MalformedURLException | URISyntaxException e) { + return null; + } + } + // Utilities /** diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index 6b71dab3..f17608bd 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -6,12 +6,7 @@ import fr.insee.kraftwerk.core.inputs.UserInputsFile; import javax.annotation.Nullable; -import java.io.File; import java.io.InputStream; -import java.net.MalformedURLException; -import java.net.URI; -import java.net.URISyntaxException; -import java.net.URL; import java.nio.file.Path; import java.time.LocalDateTime; import java.time.format.DateTimeFormatter; @@ -41,34 +36,11 @@ static Path transformToTemp(Path inDirectory) { * Change /some/path/in/campaign-name to /some/path/__other__/campaign-name */ private static Path transformToOther(Path inDirectory, String other) { - return "in".equals(inDirectory.getFileName().toString()) ? inDirectory.getParent().resolve(other) - : transformToOther(inDirectory.getParent(), other).resolve(inDirectory.getFileName()); - } - - static Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { - if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { - Path inputPath = inputDirectory.resolve(userField); - if (!new File(inputPath.toUri()).exists()) { - throw new KraftwerkException(400, String.format("The input folder \"%s\" does not exist in \"%s\".", userField, inputDirectory)); - } - return inputPath; - } else { - return null; - } - } - - static URL convertToUrl(String userField, Path inputDirectory) { - if (userField == null) { - return null; - } - try { - if (userField.startsWith("http")) { - return new URI(userField).toURL(); - } - return inputDirectory.resolve(userField).toFile().toURI().toURL(); - } catch (MalformedURLException | URISyntaxException e) { - return null; + if("in".equals(inDirectory.getFileName().toString()) && inDirectory.getParent() != null){ + return inDirectory.getParent().resolve(other); } + return "in".equals(inDirectory.getFileName().toString()) ? Path.of(other) + : transformToOther(inDirectory.getParent(), other).resolve(inDirectory.getFileName()); } //Methods to implement @@ -160,6 +132,8 @@ static URL convertToUrl(String userField, Path inputDirectory) { long getSizeOf(String path); //Misc. + Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException; + String convertToUrl(String userField, Path inputDirectory); /** * Move the input file to another directory to archive it */ diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index 9b795177..3d9670a3 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -21,6 +21,7 @@ import lombok.extern.slf4j.Slf4j; import java.io.ByteArrayInputStream; +import java.io.File; import java.io.FileInputStream; import java.io.InputStream; import java.net.MalformedURLException; @@ -94,7 +95,7 @@ public List listFileNames(String dir) { try { ArrayList filePaths = new ArrayList<>(); Iterable> results = minioClient.listObjects( - ListObjectsArgs.builder().bucket(bucketName).prefix(dir).recursive(true).build()); + ListObjectsArgs.builder().bucket(bucketName).prefix(dir.replace("\\","/")).recursive(true).build()); for (Result result : results) { filePaths.add(result.get().objectName()); @@ -108,7 +109,7 @@ public List listFileNames(String dir) { @Override public List listFilePaths(String dir) { - return listFileNames(dir); + return listFileNames(dir.replace("\\","/")); } @Override @@ -126,14 +127,14 @@ public Boolean isDirectory(String path){ try { //List files of parent to check if directory Iterable> results = minioClient.listObjects( - ListObjectsArgs.builder().bucket(bucketName).prefix(Path.of(path).getParent().toString()).recursive(true).build()); + ListObjectsArgs.builder().bucket(bucketName).prefix(Path.of(path).getParent().toString().replace("\\","/")).recursive(true).build()); for (Result result : results) { - if(result.get().objectName().equals(Path.of(path).getFileName().toString())){ - return result.get().isDir(); + if(result.get().objectName().startsWith(path)){ + return true; } } - log.warn("S3 File or folder {} not found in {}", Path.of(path).getFileName().toString(), Path.of(path).getParent().toString()); + log.warn("S3 File or folder {} not found in {}", Path.of(path).getFileName().toString().replace("\\","/"), Path.of(path).getParent().toString().replace("\\","/")); return null; } catch (Exception e) { log.error(e.toString()); @@ -144,7 +145,7 @@ public Boolean isDirectory(String path){ @Override public long getSizeOf(String path) { try { - StatObjectResponse objectStat = minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(path).build()); + StatObjectResponse objectStat = minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(path.replace("\\","/")).build()); return objectStat.size(); }catch (Exception e){ log.error(e.toString()); @@ -155,21 +156,21 @@ public long getSizeOf(String path) { @Override public void writeFile(String path, String toWrite, boolean replace) { InputStream inputStream = new ByteArrayInputStream(toWrite.getBytes()); - writeFileOnMinio(path, inputStream, toWrite.length()); + writeFileOnMinio(path.replace("\\","/"), inputStream, toWrite.length()); } @Override public String findFile(String directory, String fileRegex) throws KraftwerkException { - try (Stream files = listFileNames(directory).stream().filter(s -> s.matches(fileRegex))) { + try (Stream files = listFileNames(directory.replace("\\","/")).stream().filter(s -> s.matches(fileRegex))) { return files.findFirst() - .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + directory)); + .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + directory.replace("\\","/"))); } } @Override public InputStream readFile(String minioPath) { try { - return minioClient.getObject(GetObjectArgs.builder().bucket(bucketName).object(minioPath).build()); + return minioClient.getObject(GetObjectArgs.builder().bucket(bucketName).object(minioPath.replace("\\","/")).build()); } catch (Exception e) { log.error(e.toString()); return null; @@ -179,7 +180,7 @@ public InputStream readFile(String minioPath) { @Override public boolean isFileExists(String objectPath) { try { - minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(objectPath).build()); + minioClient.statObject(StatObjectArgs.builder().bucket(bucketName).object(objectPath.replace("\\","/")).build()); return true; } catch (ErrorResponseException e) { return false; @@ -192,19 +193,19 @@ public boolean isFileExists(String objectPath) { @Override public void moveFile(String srcMinioPath, String dstMinioPath) throws KraftwerkException { try { - copyFile(srcMinioPath, dstMinioPath); + copyFile(srcMinioPath.replace("\\","/"), dstMinioPath.replace("\\","/")); deleteFile(srcMinioPath); } catch (Exception e) { - throw new KraftwerkException(500, "Can't move file " + srcMinioPath + " to " + dstMinioPath); + throw new KraftwerkException(500, "Can't move file " + srcMinioPath.replace("\\","/") + " to " + dstMinioPath.replace("\\","/")); } } @Override public void moveFile(Path fileSystemPath, String dstMinioPath) throws KraftwerkException { try (InputStream inputStream = new FileInputStream(fileSystemPath.toFile())){ - writeFileOnMinio(dstMinioPath, inputStream, Files.size(fileSystemPath)); + writeFileOnMinio(dstMinioPath.replace("\\","/"), inputStream, Files.size(fileSystemPath)); } catch (Exception e) { - throw new KraftwerkException(500, "Can't move file " + fileSystemPath + " to " + dstMinioPath); + throw new KraftwerkException(500, "Can't move file " + fileSystemPath + " to " + dstMinioPath.replace("\\","/")); } try { Files.deleteIfExists(fileSystemPath); @@ -213,11 +214,41 @@ public void moveFile(Path fileSystemPath, String dstMinioPath) throws KraftwerkE } } + @Override + public Path convertToPath(String userField, Path inputDirectory) throws KraftwerkException { + if (userField != null && !"null".equals(userField) && !userField.isEmpty()) { + Path inputPath = inputDirectory.resolve(userField); + if (Boolean.FALSE.equals(isDirectory(inputPath.toString().replace("\\","/"))) + || isDirectory(inputPath.toString().replace("\\","/")) == null + ) { + throw new KraftwerkException(400, String.format("The input folder \"%s\" does not exist in \"%s\".", userField, inputDirectory)); + } + return inputPath; + } else { + return null; + } + } + + @Override + public String convertToUrl(String userField, Path inputDirectory) { + if (userField == null) { + return null; + } + try { + if (userField.startsWith("http")) { + return new URI(userField).toURL().toString(); + } + return inputDirectory.resolve(userField).toString(); + } catch (MalformedURLException | URISyntaxException e) { + return null; + } + } + //Utilities private void writeFileOnMinio(String minioPath, InputStream inputStream, long fileSize) { try { - minioClient.putObject(PutObjectArgs.builder().bucket(bucketName).stream(inputStream, fileSize, -1).object(minioPath).build()); + minioClient.putObject(PutObjectArgs.builder().bucket(bucketName).stream(inputStream, fileSize, -1).object(minioPath.replace("\\","/")).build()); } catch (Exception e) { log.error(e.toString()); } @@ -225,7 +256,7 @@ private void writeFileOnMinio(String minioPath, InputStream inputStream, long fi private void copyFile(String srcMinioPath, String dstMinioPath) { try { - CopySource copySource = CopySource.builder().bucket(bucketName).object(srcMinioPath).build(); + CopySource copySource = CopySource.builder().bucket(bucketName).object(srcMinioPath.replace("\\","/")).build(); minioClient.copyObject(CopyObjectArgs.builder().bucket(bucketName).object(dstMinioPath).source(copySource).build()); } catch (Exception e) { log.error(e.toString()); @@ -234,7 +265,7 @@ private void copyFile(String srcMinioPath, String dstMinioPath) { private void moveDirectory(String srcMinioPath, String dstMinioPath) { try { - for (String filePath : listFileNames(srcMinioPath)) { + for (String filePath : listFileNames(srcMinioPath.replace("\\","/"))) { moveFile(filePath, dstMinioPath + "/" + extractFileName(filePath)); } } catch (Exception e) { @@ -246,12 +277,12 @@ private String extractFileName(String filePath) { if (filePath == null || filePath.isEmpty()) { return ""; } - return Path.of(filePath).getFileName().toString(); + return Path.of(filePath).getFileName().toString().replace("\\","/"); } private void deleteFile(String minioPath) { try { - minioClient.removeObject(RemoveObjectArgs.builder().bucket(bucketName).object(minioPath).build()); + minioClient.removeObject(RemoveObjectArgs.builder().bucket(bucketName).object(minioPath.replace("\\","/")).build()); } catch (Exception e) { log.error(e.toString()); } @@ -276,7 +307,7 @@ private void archiveData(Path inputFolder, String campaignName, ModeInputs modeI private void archiveParadata(Path inputFolder, String campaignName, ModeInputs modeInputs){ if (modeInputs.getParadataFolder() != null) { moveDirectory(modeInputs.getParadataFolder().toString(), inputFolder.resolve(ARCHIVE) - .resolve(getRoot(modeInputs.getParadataFolder(), campaignName)).toString()); + .resolve(getRoot(modeInputs.getParadataFolder(), campaignName)).toString().replace("\\","/")); } } @@ -286,7 +317,7 @@ private void archiveParadata(Path inputFolder, String campaignName, ModeInputs m private void archiveReportingData(Path inputFolder, String campaignName, ModeInputs modeInputs){ if (modeInputs.getReportingDataFile() != null) { moveDirectory(modeInputs.getReportingDataFile().toString(), inputFolder.resolve(ARCHIVE) - .resolve(getRoot(modeInputs.getReportingDataFile(), campaignName)).toString()); + .resolve(getRoot(modeInputs.getReportingDataFile(), campaignName)).toString().replace("\\","/")); } } @@ -300,6 +331,6 @@ private String getRoot(Path path, String campaignName) { result.append(sep).append(directory); sep = "/"; } - return result.toString(); + return result.toString().replace("\\","/"); } } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java index 99def2a6..d5788027 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java @@ -13,34 +13,33 @@ import javax.xml.transform.stream.StreamResult; import javax.xml.transform.stream.StreamSource; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; +import lombok.AllArgsConstructor; import lombok.extern.log4j.Log4j2; @Log4j2 +@AllArgsConstructor public class SaxonTransformer { + private FileUtilsInterface fileUtilsInterface; /** * XSL transformation method using Saxon. * - * @param inputXmlURL : URL of the XML input file + * @param inputXmlPath : Path of the XML input file * @param inputXslPath : Path to the XSL file from the resources folder of the * application * @param outputXmlPath : Path to the XML output file which will be created */ - public void xslTransform(URL inputXmlURL, String inputXslPath, Path outputXmlPath) { - log.info("About to transform the file from URL: " + inputXmlURL); + public void xslTransform(String inputXmlPath, String inputXslPath, Path outputXmlPath) { + log.info("About to transform the file: " + inputXmlPath); log.info("using the XSL file " + inputXslPath); // Get the XML input file StreamSource xmlSource; InputStream xmlInput; - try { - xmlInput = inputXmlURL.openStream(); - xmlSource = new StreamSource(xmlInput); - xmlSource.setSystemId(inputXmlURL.toString()); - } catch (IOException e) { - log.error(String.format("IOException when trying to read file from URL: %s", inputXmlURL), e); - return; // to break here if the xml input file is not found - } + xmlInput = fileUtilsInterface.readFile(inputXmlPath); + xmlSource = new StreamSource(xmlInput); + xmlSource.setSystemId(inputXmlPath); // Get the XSL file StreamSource xslSource; @@ -86,13 +85,6 @@ public void xslTransform(Path inputXmlPath, String inputXslPath, Path outputXmlP log.info("About to transform the file " + inputXmlPath); log.info("using the XSL file " + inputXslPath); - try { - URL inputXmlUrl = inputXmlPath.toUri().toURL(); - xslTransform(inputXmlUrl, inputXslPath, outputXmlPath); - } catch (MalformedURLException e) { - log.error(String.format("Error when converting file path '%s' to an URL.", inputXmlPath), e); - } - + xslTransform(inputXmlPath.toString(), inputXslPath, outputXmlPath); } - } \ No newline at end of file diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java index 3a21e572..1d4e4811 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/inputs/UserInputsFileTest.java @@ -29,7 +29,7 @@ class UserInputsFileTest { @Test void testReadValidUserInput_singleMode() throws KraftwerkException { UserInputsFile userInputsFile = new UserInputsFile( - inputSamplesDirectory.resolve("kraftwerk.json"), + inputSamplesDirectory.resolve("inputs_valid.json"), inputSamplesDirectory, fileUtilsInterface); // ModeInputs modeInputs = userInputsFile.getModeInputs("CAPI"); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java index 70697ecc..fbc72ae3 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/DDIReaderTest.java @@ -45,7 +45,7 @@ void readSimpsonsV1Variables() throws MalformedURLException, KraftwerkException, "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V1), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_SIMPSONS_V1, fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -83,7 +83,7 @@ void readSimpsonsV2Variables() throws MalformedURLException, KraftwerkException, "FEELCHAREV4", "LEAVDURATION11", "LEAVDURATION52", "NB_CHAR", "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V2), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_SIMPSONS_V2, fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -111,7 +111,7 @@ void readVqsWebVariables() throws MalformedURLException, KraftwerkException, URI "RESIDM", "NHAB"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_WEB), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_VQS_WEB.toString(), fileUtilsInterface); // assertNotNull(vqsMetadata); @@ -151,7 +151,7 @@ void readVqsPapVariables() throws MalformedURLException, KraftwerkException, URI "AIDREG_B", "AIDREG_C", "AIDREG_D", "RESID", "RESIDANCIEN", "NBQUEST"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_PAP), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_VQS_PAP, fileUtilsInterface); // assertNotNull(vqsMetadata); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/LunaticReaderTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/LunaticReaderTest.java index fce0af37..ae480ce3 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/LunaticReaderTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/LunaticReaderTest.java @@ -1,6 +1,8 @@ package fr.insee.kraftwerk.core.metadata; import fr.insee.kraftwerk.core.TestConstants; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.utils.files.FileUtilsInterface; import org.junit.jupiter.api.Test; import java.nio.file.Path; @@ -11,12 +13,13 @@ class LunaticReaderTest { static final Path lunaticSamplesPath = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "lunatic"); + static final FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); @Test void readLogX21TelLunaticFile() { // CalculatedVariables calculatedVariables = LunaticReader.getCalculatedFromLunatic( - lunaticSamplesPath.resolve("log2021x21_tel.json")); + lunaticSamplesPath.resolve("log2021x21_tel.json"), fileUtilsInterface); // assertNotNull(calculatedVariables); @@ -41,7 +44,7 @@ void readLogX21TelLunaticFile() { void readLogX22WebLunaticFile() { // CalculatedVariables calculatedVariables = LunaticReader.getCalculatedFromLunatic( - lunaticSamplesPath.resolve("log2021x22_web.json")); + lunaticSamplesPath.resolve("log2021x22_web.json"), fileUtilsInterface); // assertNotNull(calculatedVariables); @@ -55,7 +58,7 @@ void readLogX22WebLunaticFile() { void readVariablesFromLogX21WebLunaticFile() { // MetadataModel variables = LunaticReader.getMetadataFromLunatic( - lunaticSamplesPath.resolve("log2021x21_web.json")); + lunaticSamplesPath.resolve("log2021x21_web.json"), fileUtilsInterface); // assertNotNull(variables); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java index 9288af0a..1e2941a1 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/metadata/VariableTest.java @@ -37,7 +37,7 @@ void readSimpsonsV1Variables() throws MalformedURLException, KraftwerkException, "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V1), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_SIMPSONS_V1, fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -75,7 +75,7 @@ void readSimpsonsV2Variables() throws MalformedURLException, KraftwerkException, "FEELCHAREV4", "LEAVDURATION11", "LEAVDURATION52", "NB_CHAR", "SURVEY_COMMENT"); MetadataModel simpsonsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_SIMPSONS_V2), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_SIMPSONS_V2.toString(), fileUtilsInterface); // assertNotNull(simpsonsMetadata); @@ -103,7 +103,7 @@ void readVqsWebVariables() throws MalformedURLException, KraftwerkException, URI "RESIDM", "NHAB"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_WEB), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_VQS_WEB, fileUtilsInterface); // assertNotNull(vqsMetadata); @@ -143,7 +143,7 @@ void readVqsPapVariables() throws MalformedURLException, KraftwerkException, URI "AIDREG_B", "AIDREG_C", "AIDREG_D", "RESID", "RESIDANCIEN", "NBQUEST"); MetadataModel vqsMetadata = DDIReader - .getMetadataFromDDI(Constants.convertToUrl(DDI_FOLDER + "/" + DDI_VQS_PAP), fileUtilsInterface); + .getMetadataFromDDI(DDI_FOLDER + "/" + DDI_VQS_PAP, fileUtilsInterface); // assertNotNull(vqsMetadata); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java index e1b58487..d17b2a03 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBindingsSequenceTest.java @@ -30,7 +30,7 @@ class BuildBindingsSequenceTest { void buildVtlBindings_errorWithoutMetadata() throws KraftwerkException { //GIVEN UserInputsFile userInputsFile = new UserInputsFile( - inputSamplesDirectory.resolve("kraftwerk.json"), + inputSamplesDirectory.resolve("inputs_valid.json"), inputSamplesDirectory, fileUtilsInterface); String dataMode = "CAPI"; VtlBindings vtlBindings = new VtlBindings(); @@ -50,7 +50,7 @@ void buildVtlBindings_errorWithoutMetadata() throws KraftwerkException { void buildVtlBindings_success_changingDdi_and_reportingData(boolean withDdi, boolean withAllReportingData ) throws KraftwerkException { //GIVEN UserInputsFile userInputsFile = new UserInputsFile( - inputSamplesDirectory.resolve("kraftwerk.json"), + inputSamplesDirectory.resolve("inputs_valid.json"), inputSamplesDirectory, fileUtilsInterface); String dataMode = "CAPI"; VtlBindings vtlBindings = new VtlBindings(); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java index 02fe2119..8eb1d00c 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java @@ -5,6 +5,7 @@ import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.inputs.UserInputsFile; import org.assertj.core.api.Assertions; +import org.junit.Assert; import org.junit.jupiter.api.Test; import java.io.File; @@ -306,4 +307,41 @@ void moveFileTest_FromPath() throws KraftwerkException, IOException { Files.deleteIfExists(inputDirectory.resolve("test1.txt")); Files.deleteIfExists(inputDirectory2); } + + + + @Test + void convertToPathTest_nullUserField() throws KraftwerkException { + Assertions.assertThat(fileSystemImpl.convertToPath(null,null)).isNull(); + } + + @Test + void convertToPathTest_directoryNotExists(){ + Assert.assertThrows(KraftwerkException.class, () -> fileSystemImpl.convertToPath("test", Path.of("NOT SUPPOSED TO EXIST"))); + } + + @Test + void convertToPathTest() throws KraftwerkException { + //GIVEN + String campaignName = "convert_path"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN+THEN + Assertions.assertThat(fileSystemImpl.convertToPath("test.txt", inputDirectory)).exists(); + } + + @Test + void convertToURLTest_nullUserField(){ + Assertions.assertThat(fileSystemImpl.convertToUrl(null,null)).isNull(); + } + + @Test + void convertToURLTest(){ + //GIVEN + String campaignName = "convert_path"; + Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); + + //WHEN+THEN + Assertions.assertThat(fileSystemImpl.convertToUrl("test.txt", inputDirectory)).endsWith("test.txt"); + } } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java index f1c2c4b4..4a799379 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemInterfaceTest.java @@ -25,40 +25,5 @@ void testTransformToOut2() { assertEquals(path, FileUtilsInterface.transformToOut(Paths.get("C://Users/in/Kraftwerk/src/test/resources/functional_tests/in/VQS"), LocalDateTime.now()).getParent()); } - @Test - void convertToPathTest_nullUserField() throws KraftwerkException { - Assertions.assertThat(FileUtilsInterface.convertToPath(null,null)).isNull(); - } - - @Test - void convertToPathTest_directoryNotExists(){ - Assert.assertThrows(KraftwerkException.class, () -> FileUtilsInterface.convertToPath("test", Path.of("NOT SUPPOSED TO EXIST"))); - } - - @Test - void convertToPathTest() throws KraftwerkException { - //GIVEN - String campaignName = "convert_path"; - Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); - - //WHEN+THEN - Assertions.assertThat(FileUtilsInterface.convertToPath("test.txt", inputDirectory)).exists(); - } - - @Test - void convertToURLTest_nullUserField(){ - Assertions.assertThat(FileUtilsInterface.convertToUrl(null,null)).isNull(); - } - - @Test - void convertToURLTest(){ - //GIVEN - String campaignName = "convert_path"; - Path inputDirectory = Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "files", campaignName); - - //WHEN+THEN - Assertions.assertThat(FileUtilsInterface.convertToUrl("test.txt", inputDirectory).getFile()).endsWith("test.txt"); - } - } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java deleted file mode 100644 index 70aa5fd4..00000000 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/MinioImplTest.java +++ /dev/null @@ -1,4 +0,0 @@ -package fr.insee.kraftwerk.core.utils.files; - -public class MinioImplTest { -} diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java index 700437e3..6a0d986e 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java @@ -21,7 +21,7 @@ void applyXsltScript(){ String inXmlFile = TestConstants.UNIT_TESTS_DIRECTORY + "/utils/xsl/note.xml"; String outXmlFile = TestConstants.UNIT_TESTS_DUMP + "/xsl-output.xml"; // - SaxonTransformer saxonTransformer = new SaxonTransformer(); + SaxonTransformer saxonTransformer = new SaxonTransformer(fileUtilsInterface); saxonTransformer.xslTransform(Path.of(inXmlFile), xsltTestScript,Path.of(outXmlFile)); // String inContent = TextFileReader.readFromPath(Path.of(inXmlFile), fileUtilsInterface); diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java index 28159230..5ca525fc 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/CalculatedProcessingDefinition.java @@ -65,7 +65,7 @@ public void getCampaignFiles(String campaignName, String dataMode) throws Malfor this.dataMode = dataMode; // metadataModel = DDIReader.getMetadataFromDDI( - Constants.convertToUrl(campaignPacks.get(campaignName).get(dataMode).get("ddi")), new FileSystemImpl()); + Constants.convertToUrl(campaignPacks.get(campaignName).get(dataMode).get("ddi")).toString(), new FileSystemImpl()); // SurveyRawData data = new SurveyRawData(); data.setMetadataModel(metadataModel); @@ -80,7 +80,7 @@ public void getCampaignFiles(String campaignName, String dataMode) throws Malfor public void readCampaignData() { // CalculatedVariables calculatedVariables = LunaticReader.getCalculatedFromLunatic( - Path.of(campaignPacks.get(campaignName).get(dataMode).get("lunatic"))); + Path.of(campaignPacks.get(campaignName).get(dataMode).get("lunatic")), new FileSystemImpl()); DataProcessing calculatedProcessing = new CalculatedProcessing(vtlBindings,calculatedVariables, new FileSystemImpl()); calculatedProcessing.applyVtlTransformations("TEST", null,errors); // diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java index 16224751..8646bc65 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/DDIGetterDefinitions.java @@ -43,8 +43,8 @@ public void compare_ddi(String nameDDI) throws IOException, URISyntaxException { tempFile.deleteOnExit(); Path tempPath = Paths.get(tempFile.getAbsolutePath()); URL url = new URI(linkDDI).toURL(); - SaxonTransformer transformer = new SaxonTransformer(); - transformer.xslTransform(url, Constants.XSLT_STRUCTURED_VARIABLES, tempPath); + SaxonTransformer transformer = new SaxonTransformer(new FileSystemImpl()); + transformer.xslTransform(url.toString(), Constants.XSLT_STRUCTURED_VARIABLES, tempPath); actualString = TextFileReader.readFromPath(tempPath, new FileSystemImpl()); diff --git a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java index 6a469758..9680470e 100644 --- a/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java +++ b/kraftwerk-functional-tests/src/test/java/cucumber/functional_tests/VariablesGetterDefinitions.java @@ -32,7 +32,7 @@ public void set_linkDDI(String linkDDI) throws MalformedURLException, URISyntaxE @When("I try to collect the variables's infos") public void collect_variables() throws KraftwerkException { - metadataModel = DDIReader.getMetadataFromDDI(linkDDI, new FileSystemImpl()); + metadataModel = DDIReader.getMetadataFromDDI(linkDDI.toString(), new FileSystemImpl()); } @Then("The variables I try to count should answer {int} and have {string} in it") From edc802f028e6208dc5dce4ef38c771369e0ab946 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 26 Jun 2024 08:44:17 +0200 Subject: [PATCH 27/46] Removed unused --- .../java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java | 2 +- .../fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java | 1 - 2 files changed, 1 insertion(+), 2 deletions(-) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java index 6815c205..1e232805 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/inputs/UserInputsGenesis.java @@ -22,7 +22,7 @@ public class UserInputsGenesis extends UserInputs{ private final List modes; - public UserInputsGenesis(boolean hasConfigFile, Path inputDirectory, List modes, FileUtilsInterface fileUtilsInterface) throws KraftwerkException, IOException { + public UserInputsGenesis(boolean hasConfigFile, Path inputDirectory, List modes, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { super(inputDirectory, fileUtilsInterface); this.hasConfigFile = hasConfigFile; this.modes=modes; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java index 6cb281cb..43e6218e 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileSystemImpl.java @@ -16,7 +16,6 @@ import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; -import java.net.URL; import java.nio.file.Files; import java.nio.file.Path; import java.nio.file.StandardCopyOption; From aa7a18c37f42f695901e49232d9c76f330859206 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 26 Jun 2024 09:48:42 +0200 Subject: [PATCH 28/46] Fix http URL case --- .../fr/insee/kraftwerk/core/metadata/DDIReader.java | 2 +- .../kraftwerk/core/utils/xsl/SaxonTransformer.java | 11 ++++++++--- .../core/utils/xsl/SaxonTransformerTest.java | 3 ++- 3 files changed, 11 insertions(+), 5 deletions(-) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java index c4933525..bfa5beb2 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/metadata/DDIReader.java @@ -77,7 +77,7 @@ public static MetadataModel getMetadataFromDDI(String ddiUrlString, FileUtilsInt * @param ddiUrlString : URL of the DDI file. * @param variablesFilePath : Path of the 'variables.xml' file to be generated. */ - private static void transformDDI(String ddiUrlString, Path variablesFilePath, FileUtilsInterface fileUtilsInterface) { + private static void transformDDI(String ddiUrlString, Path variablesFilePath, FileUtilsInterface fileUtilsInterface) throws IOException { SaxonTransformer saxonTransformer = new SaxonTransformer(fileUtilsInterface); saxonTransformer.xslTransform(ddiUrlString, Constants.XSLT_STRUCTURED_VARIABLES, variablesFilePath); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java index d5788027..5267ae5f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformer.java @@ -3,6 +3,7 @@ import java.io.IOException; import java.io.InputStream; import java.net.MalformedURLException; +import java.net.URI; import java.net.URL; import java.nio.file.Path; @@ -30,14 +31,18 @@ public class SaxonTransformer { * application * @param outputXmlPath : Path to the XML output file which will be created */ - public void xslTransform(String inputXmlPath, String inputXslPath, Path outputXmlPath) { + public void xslTransform(String inputXmlPath, String inputXslPath, Path outputXmlPath) throws IOException { log.info("About to transform the file: " + inputXmlPath); log.info("using the XSL file " + inputXslPath); // Get the XML input file StreamSource xmlSource; InputStream xmlInput; - xmlInput = fileUtilsInterface.readFile(inputXmlPath); + if(inputXmlPath.startsWith("http")){ + xmlInput = URI.create(inputXmlPath).toURL().openStream(); + }else{ + xmlInput = fileUtilsInterface.readFile(inputXmlPath); + } xmlSource = new StreamSource(xmlInput); xmlSource.setSystemId(inputXmlPath); @@ -81,7 +86,7 @@ public void xslTransform(String inputXmlPath, String inputXslPath, Path outputXm * application * @param outputXmlPath : Path to the XML output file which will be created */ - public void xslTransform(Path inputXmlPath, String inputXslPath, Path outputXmlPath) { + public void xslTransform(Path inputXmlPath, String inputXslPath, Path outputXmlPath) throws IOException { log.info("About to transform the file " + inputXmlPath); log.info("using the XSL file " + inputXslPath); diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java index 6a0d986e..07b0d933 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/xsl/SaxonTransformerTest.java @@ -1,5 +1,6 @@ package fr.insee.kraftwerk.core.utils.xsl; +import java.io.IOException; import java.net.MalformedURLException; import java.nio.file.Path; @@ -16,7 +17,7 @@ class SaxonTransformerTest { FileUtilsInterface fileUtilsInterface = new FileSystemImpl(); @Test - void applyXsltScript(){ + void applyXsltScript() throws IOException { String xsltTestScript = TestConstants.UNIT_TESTS_DIRECTORY + "/utils/xsl/do-nothing.xsl"; String inXmlFile = TestConstants.UNIT_TESTS_DIRECTORY + "/utils/xsl/note.xml"; String outXmlFile = TestConstants.UNIT_TESTS_DUMP + "/xsl-output.xml"; From 4c9d5df2a434a305e8acdc6be4292d83b2018cd3 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 26 Jun 2024 09:59:26 +0200 Subject: [PATCH 29/46] Update FileSystemImplTest.java --- .../fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java | 2 +- 1 file changed, 1 insertion(+), 1 deletion(-) diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java index 8eb1d00c..963d5b16 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/files/FileSystemImplTest.java @@ -129,7 +129,7 @@ void listFileNamesTest(){ List fileNames = fileSystemImpl.listFileNames(inputDirectory.toString()); //THEN - Assertions.assertThat(fileNames).containsExactly("file1.txt","file2.json","file3.xml"); + Assertions.assertThat(fileNames).contains("file1.txt","file2.json","file3.xml"); } @Test From 6edb6d860069a045d549abfc6ec8f18223cc044d Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 26 Jun 2024 13:43:40 +0200 Subject: [PATCH 30/46] Update KraftwerkBatch.java --- .../java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index 58fba5e8..3ef30604 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -92,10 +92,10 @@ private static void checkArgs(String[] args) throws IllegalArgumentException{ throw new IllegalArgumentException("Invalid number of arguments ! Got %s instead of 4 !".formatted(args.length)); } if(!args[1].equals("true") && !args[1].equals("false")){ - throw new IllegalArgumentException("Invalid archiveAtEnd boolean argument !"); + throw new IllegalArgumentException("Invalid archiveAtEnd boolean argument ! : %s".formatted(args[1])); } if(!args[2].equals("true") && !args[2].equals("false")){ - throw new IllegalArgumentException("Invalid withAllReportingData boolean argument !"); + throw new IllegalArgumentException("Invalid withAllReportingData boolean argument ! %s".formatted(args[2])); } } } From 832f06e00309de6c4083796cb57383c2e57de23b Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 26 Jun 2024 15:52:55 +0200 Subject: [PATCH 31/46] Overwrite default directory if MinIO enabled --- .../java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java | 5 +++++ 1 file changed, 5 insertions(+) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index 3ef30604..a64a35a9 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -61,6 +61,11 @@ public void run(String... args) throws Exception{ archiveAtEnd = false; } + //Replace default directory if using MinIO + if(minioConfig.isEnable()){ + defaultDirectory = ""; + } + //Run kraftwerk if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ From eb27d6f1a3f3c28175a1597c9c5680ec6b00f507 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Wed, 26 Jun 2024 16:00:24 +0200 Subject: [PATCH 32/46] Overwrite default directory if using MinIO (in services) --- .../kraftwerk/api/services/KraftwerkService.java | 4 ++++ .../insee/kraftwerk/api/services/MainService.java | 10 ++++++++++ .../kraftwerk/api/services/SplitterService.java | 5 +++++ .../kraftwerk/api/services/StepByStepService.java | 14 ++++++++++++++ 4 files changed, 33 insertions(+) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java index dd1a39b6..806657ab 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java @@ -58,6 +58,10 @@ public void initializeWithProperties() { if(minioConfig.isEnable()){ MinioClient minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + if(minioConfig.isEnable()){ + defaultDirectory = ""; + } }else{ fileUtilsInterface = new FileSystemImpl(); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java index 3eff6461..0304d9ca 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java @@ -48,6 +48,8 @@ public MainService(ConfigProperties configProperties, MinioConfig minioConfig) { if(minioConfig != null && minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); useMinio = true; + //Replace default directory if using MinIO + defaultDirectory = ""; } } @@ -63,6 +65,8 @@ public ResponseEntity mainService( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -92,6 +96,8 @@ public ResponseEntity mainFileByFile( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -120,6 +126,8 @@ public ResponseEntity mainLunaticOnly( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -143,6 +151,8 @@ public ResponseEntity mainGenesis( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java index c8fdbca8..8014dde5 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java @@ -42,6 +42,11 @@ public ResponseEntity saveResponsesFromXmlFile(@RequestParam("inputFolde new MinioImpl(MinioClient.builder().credentials(minioConfig.getAccessKey(),minioConfig.getSecretKey()).endpoint(minioConfig.getEndpoint()).build(), minioConfig.getBucketName()) : new FileSystemImpl(); + if(fileSystemType.equals(FileSystemType.MINIO)){ + //Replace default directory if using MinIO + defaultDirectory = ""; + } + XmlSplitter.split(String.format("%s/in/%s/",defaultDirectory,inputFolder), filename, String.format("%s/in/%s/",defaultDirectory,outputFolder), "SurveyUnit", nbSU, fileUtilsInterface); return new ResponseEntity<>("File split", HttpStatus.OK); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java index db707c34..92cdef17 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java @@ -53,6 +53,8 @@ public StepByStepService(MinioConfig minioConfig) { if(minioConfig != null && minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); useMinio = true; + //Replace default directory if using MinIO + defaultDirectory = ""; } } @@ -68,6 +70,8 @@ public ResponseEntity buildVtlBindings( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -112,6 +116,8 @@ public ResponseEntity buildVtlBindingsByDataMode( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -149,6 +155,8 @@ public ResponseEntity unimodalProcessing( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -197,6 +205,8 @@ public ResponseEntity multimodalProcessing( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -254,6 +264,8 @@ public ResponseEntity writeOutputFiles( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -300,6 +312,8 @@ public ResponseEntity archiveService( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); + //Replace default directory if using MinIO + defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } From 726c578c509dd28cc3fed3e512a1fda95394c488 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Thu, 27 Jun 2024 09:29:00 +0200 Subject: [PATCH 33/46] Revert "Overwrite default directory if using MinIO (in services)" This reverts commit eb27d6f1a3f3c28175a1597c9c5680ec6b00f507. --- .../kraftwerk/api/services/KraftwerkService.java | 4 ---- .../insee/kraftwerk/api/services/MainService.java | 10 ---------- .../kraftwerk/api/services/SplitterService.java | 5 ----- .../kraftwerk/api/services/StepByStepService.java | 14 -------------- 4 files changed, 33 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java index 806657ab..dd1a39b6 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/KraftwerkService.java @@ -58,10 +58,6 @@ public void initializeWithProperties() { if(minioConfig.isEnable()){ MinioClient minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - if(minioConfig.isEnable()){ - defaultDirectory = ""; - } }else{ fileUtilsInterface = new FileSystemImpl(); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java index 0304d9ca..3eff6461 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java @@ -48,8 +48,6 @@ public MainService(ConfigProperties configProperties, MinioConfig minioConfig) { if(minioConfig != null && minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); useMinio = true; - //Replace default directory if using MinIO - defaultDirectory = ""; } } @@ -65,8 +63,6 @@ public ResponseEntity mainService( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -96,8 +92,6 @@ public ResponseEntity mainFileByFile( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -126,8 +120,6 @@ public ResponseEntity mainLunaticOnly( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -151,8 +143,6 @@ public ResponseEntity mainGenesis( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java index 8014dde5..c8fdbca8 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/SplitterService.java @@ -42,11 +42,6 @@ public ResponseEntity saveResponsesFromXmlFile(@RequestParam("inputFolde new MinioImpl(MinioClient.builder().credentials(minioConfig.getAccessKey(),minioConfig.getSecretKey()).endpoint(minioConfig.getEndpoint()).build(), minioConfig.getBucketName()) : new FileSystemImpl(); - if(fileSystemType.equals(FileSystemType.MINIO)){ - //Replace default directory if using MinIO - defaultDirectory = ""; - } - XmlSplitter.split(String.format("%s/in/%s/",defaultDirectory,inputFolder), filename, String.format("%s/in/%s/",defaultDirectory,outputFolder), "SurveyUnit", nbSU, fileUtilsInterface); return new ResponseEntity<>("File split", HttpStatus.OK); } diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java index 92cdef17..db707c34 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java @@ -53,8 +53,6 @@ public StepByStepService(MinioConfig minioConfig) { if(minioConfig != null && minioConfig.isEnable()){ minioClient = MinioClient.builder().endpoint(minioConfig.getEndpoint()).credentials(minioConfig.getAccessKey(), minioConfig.getSecretKey()).build(); useMinio = true; - //Replace default directory if using MinIO - defaultDirectory = ""; } } @@ -70,8 +68,6 @@ public ResponseEntity buildVtlBindings( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -116,8 +112,6 @@ public ResponseEntity buildVtlBindingsByDataMode( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -155,8 +149,6 @@ public ResponseEntity unimodalProcessing( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -205,8 +197,6 @@ public ResponseEntity multimodalProcessing( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -264,8 +254,6 @@ public ResponseEntity writeOutputFiles( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } @@ -312,8 +300,6 @@ public ResponseEntity archiveService( FileUtilsInterface fileUtilsInterface; if(Boolean.TRUE.equals(useMinio)){ fileUtilsInterface = new MinioImpl(minioClient, minioConfig.getBucketName()); - //Replace default directory if using MinIO - defaultDirectory = ""; }else{ fileUtilsInterface = new FileSystemImpl(); } From 38b410406b2eea86cd366a0d9dd1f748aac26d96 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Thu, 27 Jun 2024 09:29:03 +0200 Subject: [PATCH 34/46] Revert "Overwrite default directory if MinIO enabled" This reverts commit 832f06e00309de6c4083796cb57383c2e57de23b. --- .../java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java | 5 ----- 1 file changed, 5 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index a64a35a9..3ef30604 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -61,11 +61,6 @@ public void run(String... args) throws Exception{ archiveAtEnd = false; } - //Replace default directory if using MinIO - if(minioConfig.isEnable()){ - defaultDirectory = ""; - } - //Run kraftwerk if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ From 53dfbe54e82439cfa81368f76195d2f4b939de33 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 28 Jun 2024 11:40:11 +0200 Subject: [PATCH 35/46] Update MinioImpl.java --- .../java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java | 2 -- 1 file changed, 2 deletions(-) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index 3d9670a3..af79974c 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -21,13 +21,11 @@ import lombok.extern.slf4j.Slf4j; import java.io.ByteArrayInputStream; -import java.io.File; import java.io.FileInputStream; import java.io.InputStream; import java.net.MalformedURLException; import java.net.URI; import java.net.URISyntaxException; -import java.net.URL; import java.nio.file.Files; import java.nio.file.Path; import java.util.ArrayList; From 0825b3e27792b712fad1f37365690640451c9a6e Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Tue, 2 Jul 2024 15:12:02 +0200 Subject: [PATCH 36/46] fix Genesis endpoint batch --- .../kraftwerk/api/batch/KraftwerkBatch.java | 73 ++++++++++--------- .../api/process/MainProcessingGenesis.java | 3 +- .../kraftwerk/api/services/MainService.java | 1 - .../sequence/ControlInputSequenceGenesis.java | 4 +- .../core/utils/files/FileUtilsInterface.java | 4 +- .../kraftwerk/core/utils/files/MinioImpl.java | 6 +- 6 files changed, 49 insertions(+), 42 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index 3ef30604..773c0569 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -5,6 +5,7 @@ import fr.insee.kraftwerk.api.process.MainProcessing; import fr.insee.kraftwerk.api.process.MainProcessingGenesis; import fr.insee.kraftwerk.api.services.KraftwerkService; +import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.utils.files.MinioImpl; import io.minio.MinioClient; import lombok.extern.slf4j.Slf4j; @@ -37,48 +38,52 @@ public KraftwerkBatch(ConfigProperties configProperties, MinioConfig minioConfig } @Override - public void run(String... args) throws Exception{ - //If .jar launched with cli args - if (args.length > 0) { - log.info("Launching Kraftwerk using cli"); + public void run(String... args) { + try { + //If .jar launched with cli args + if (args.length > 0) { + log.info("Launching Kraftwerk using cli"); - //Check arguments - checkArgs(args); + //Check arguments + checkArgs(args); - //Parse arguments - KraftwerkServiceType kraftwerkServiceType = KraftwerkServiceType.valueOf(args[0]); - boolean archiveAtEnd = Boolean.parseBoolean(args[1]); - boolean withAllReportingData = Boolean.parseBoolean(args[2]); - String inDirectory = args[3]; + //Parse arguments + KraftwerkServiceType kraftwerkServiceType = KraftwerkServiceType.valueOf(args[0]); + boolean archiveAtEnd = Boolean.parseBoolean(args[1]); + boolean withAllReportingData = Boolean.parseBoolean(args[2]); + String inDirectory = args[3]; - //Kraftwerk service type related parameters - boolean fileByFile = kraftwerkServiceType == KraftwerkServiceType.FILE_BY_FILE; - boolean withDDI = kraftwerkServiceType != KraftwerkServiceType.LUNATIC_ONLY; - if(kraftwerkServiceType != KraftwerkServiceType.MAIN){ - withAllReportingData = false; - } - if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ - archiveAtEnd = false; - } + //Kraftwerk service type related parameters + boolean fileByFile = kraftwerkServiceType == KraftwerkServiceType.FILE_BY_FILE; + boolean withDDI = kraftwerkServiceType != KraftwerkServiceType.LUNATIC_ONLY; + if (kraftwerkServiceType != KraftwerkServiceType.MAIN) { + withAllReportingData = false; + } + if (kraftwerkServiceType == KraftwerkServiceType.GENESIS) { + archiveAtEnd = false; + } - //Run kraftwerk - if(kraftwerkServiceType == KraftwerkServiceType.GENESIS){ - MainProcessingGenesis mainProcessingGenesis = new MainProcessingGenesis(configProperties, new MinioImpl(minioClient, minioConfig.getBucketName())); - mainProcessingGenesis.runMain(inDirectory); - }else{ - MainProcessing mainProcessing = new MainProcessing(inDirectory, fileByFile, withAllReportingData, withDDI, defaultDirectory, limitSize, new MinioImpl(minioClient, minioConfig.getBucketName())); - mainProcessing.runMain(); - } + //Run kraftwerk + if (kraftwerkServiceType == KraftwerkServiceType.GENESIS) { + MainProcessingGenesis mainProcessingGenesis = new MainProcessingGenesis(configProperties, new MinioImpl(minioClient, minioConfig.getBucketName())); + mainProcessingGenesis.runMain(inDirectory); + } else { + MainProcessing mainProcessing = new MainProcessing(inDirectory, fileByFile, withAllReportingData, withDDI, defaultDirectory, limitSize, new MinioImpl(minioClient, minioConfig.getBucketName())); + mainProcessing.runMain(); + } - //Archive - if(Boolean.TRUE.equals(archiveAtEnd)){ - KraftwerkService kraftwerkService = new KraftwerkService(minioConfig); - kraftwerkService.archive(inDirectory, new MinioImpl(minioClient, minioConfig.getBucketName())); + //Archive + if (Boolean.TRUE.equals(archiveAtEnd)) { + KraftwerkService kraftwerkService = new KraftwerkService(minioConfig); + kraftwerkService.archive(inDirectory, new MinioImpl(minioClient, minioConfig.getBucketName())); + } + System.exit(0); } - - System.exit(0); + }catch(Exception e){ + log.error(e.toString()); } + System.exit(1); } /** diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java index 6ccc94d7..b1747c3f 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/process/MainProcessingGenesis.java @@ -63,8 +63,9 @@ public MainProcessingGenesis(ConfigProperties config, FileUtilsInterface fileUti this.fileUtilsInterface = fileUtilsInterface; } - public void init(String idCampaign) throws KraftwerkException, IOException { + public void init(String idCampaign) throws KraftwerkException { log.info("Kraftwerk main service started for campaign: " + idCampaign); + this.controlInputSequenceGenesis = new ControlInputSequenceGenesis("", fileUtilsInterface); this.executionDateTime = LocalDateTime.now(); inDirectory = controlInputSequenceGenesis.getInDirectory(idCampaign); //First we check the modes present in database for the given questionnaire diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java index 3eff6461..c287520a 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/MainService.java @@ -150,7 +150,6 @@ public ResponseEntity mainGenesis( MainProcessingGenesis mpGenesis = new MainProcessingGenesis(configProperties, fileUtilsInterface); try { - mpGenesis.setControlInputSequenceGenesis(new ControlInputSequenceGenesis(defaultDirectory, fileUtilsInterface)); mpGenesis.runMain(idCampaign); } catch (KraftwerkException e) { return ResponseEntity.status(e.getStatus()).body(e.getMessage()); diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java index 8d12f1c1..d82b8f63 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/ControlInputSequenceGenesis.java @@ -12,7 +12,7 @@ public class ControlInputSequenceGenesis { String defaultDirectory; - private static final String INPUT_FOLDER = "in"; + private static final String SPEC_FOLDER = "specs"; private final FileUtilsInterface fileUtilsInterface; @Getter @@ -25,7 +25,7 @@ public ControlInputSequenceGenesis(String defaultDirectory, FileUtilsInterface f } public Path getInDirectory(String inDirectoryParam) { - Path inDirectory = Paths.get(defaultDirectory, INPUT_FOLDER, inDirectoryParam); + Path inDirectory = Paths.get(defaultDirectory,SPEC_FOLDER, inDirectoryParam); hasConfigFile = verifyInDirectory(inDirectory); return inDirectory; } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java index f17608bd..2bbc072f 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/FileUtilsInterface.java @@ -36,10 +36,10 @@ static Path transformToTemp(Path inDirectory) { * Change /some/path/in/campaign-name to /some/path/__other__/campaign-name */ private static Path transformToOther(Path inDirectory, String other) { - if("in".equals(inDirectory.getFileName().toString()) && inDirectory.getParent() != null){ + if(("in".equals(inDirectory.getFileName().toString()) || "specs".equals(inDirectory.getFileName().toString())) && inDirectory.getParent() != null){ return inDirectory.getParent().resolve(other); } - return "in".equals(inDirectory.getFileName().toString()) ? Path.of(other) + return "in".equals(inDirectory.getFileName().toString()) || "specs".equals(inDirectory.getFileName().toString()) ? Path.of(other) : transformToOther(inDirectory.getParent(), other).resolve(inDirectory.getFileName()); } diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java index af79974c..4adb2d4e 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/utils/files/MinioImpl.java @@ -159,9 +159,11 @@ public void writeFile(String path, String toWrite, boolean replace) { @Override public String findFile(String directory, String fileRegex) throws KraftwerkException { - try (Stream files = listFileNames(directory.replace("\\","/")).stream().filter(s -> s.matches(fileRegex))) { + //Stream of files with filename matching fileRegex + try (Stream files = listFileNames(directory.replace("\\","/")) + .stream().filter(s -> s.split("/")[s.split("/").length - 1].matches(fileRegex))) { return files.findFirst() - .orElseThrow(() -> new KraftwerkException(404, "No DDI file (ddi*.xml) found in " + directory.replace("\\","/"))); + .orElseThrow(() -> new KraftwerkException(404, "No file with regex " + fileRegex + " found in " + directory.replace("\\","/"))); } } From 0154af1b32a2a0b53580bd597d4ea1a1b5de41a0 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 5 Jul 2024 10:26:39 +0200 Subject: [PATCH 37/46] Fix API mode not launching --- .../fr/insee/kraftwerk/api/batch/KraftwerkBatch.java | 9 ++++++--- 1 file changed, 6 insertions(+), 3 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index 773c0569..9f0fa579 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -5,7 +5,6 @@ import fr.insee.kraftwerk.api.process.MainProcessing; import fr.insee.kraftwerk.api.process.MainProcessingGenesis; import fr.insee.kraftwerk.api.services.KraftwerkService; -import fr.insee.kraftwerk.core.exceptions.KraftwerkException; import fr.insee.kraftwerk.core.utils.files.MinioImpl; import io.minio.MinioClient; import lombok.extern.slf4j.Slf4j; @@ -42,7 +41,7 @@ public void run(String... args) { try { //If .jar launched with cli args if (args.length > 0) { - log.info("Launching Kraftwerk using cli"); + log.info("Launching Kraftwerk in CLI mode..."); //Check arguments checkArgs(args); @@ -83,7 +82,11 @@ public void run(String... args) { }catch(Exception e){ log.error(e.toString()); } - System.exit(1); + if(args.length > 0) { + System.exit(1); + }else{ + log.info("Launching Kraftwerk in API mode..."); + } } /** From 47c8138ef6ea6bd34f9b28bcda322b3df284ee1a Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Thu, 11 Jul 2024 10:00:18 +0200 Subject: [PATCH 38/46] Fixes after conflicts --- .../java/fr/insee/kraftwerk/core/outputs/OutputFiles.java | 2 +- .../kraftwerk/core/outputs/parquet/ParquetOutputFiles.java | 5 +++-- 2 files changed, 4 insertions(+), 3 deletions(-) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java index 6dab0a5d..9892cdea 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/OutputFiles.java @@ -28,7 +28,7 @@ public abstract class OutputFiles { private final VtlBindings vtlBindings; private final Set datasetToCreate = new HashSet<>(); private final Statement database; - private final FileUtilsInterface fileUtilsInterface; + protected final FileUtilsInterface fileUtilsInterface; /** * When an instance is created, the output folder is created. diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java index e4d64644..7a0f3019 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java @@ -38,11 +38,12 @@ public class ParquetOutputFiles extends OutputFiles { * @param outDirectory Out directory defined in application properties. * @param vtlBindings Vtl bindings where datasets are stored. * @param modes list of modes names - * @param databaseConnection connection to duckDb database + * @param database connection to duckDb database * @param fileUtilsInterface file interface to use (file system or minio) */ - public ParquetOutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement database, fileUtilsInterface) { + public ParquetOutputFiles(Path outDirectory, VtlBindings vtlBindings, List modes, Statement database, + FileUtilsInterface fileUtilsInterface) { super(outDirectory, vtlBindings, modes, database, fileUtilsInterface); } From 43f2231d6d369ffc1b6f42e72632936196a03ecf Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Thu, 11 Jul 2024 10:00:36 +0200 Subject: [PATCH 39/46] fixes --- .../fr/insee/kraftwerk/api/services/StepByStepService.java | 1 + .../fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java | 2 +- .../java/fr/insee/kraftwerk/core/sequence/WriterSequence.java | 3 ++- 3 files changed, 4 insertions(+), 2 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java index a0b866ff..be3bfce1 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/StepByStepService.java @@ -28,6 +28,7 @@ import java.nio.file.Path; import java.sql.Connection; import java.sql.SQLException; +import java.sql.Statement; import java.time.LocalDateTime; import java.util.ArrayList; import java.util.List; diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java index ed42885b..c173cbb8 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/csv/CsvOutputFiles.java @@ -78,7 +78,7 @@ public void writeOutputTables(Map metadataModels) throws Files.write(tmpOutputFile.toPath(), buildHeader(columnNames, boolColumnNames, boolColumnIndexes).getBytes()); //Data export into temp file - StringBuilder exportCsvQuery = getExportCsvQuery(datasetName, outputFile, columnNames); + StringBuilder exportCsvQuery = getExportCsvQuery(datasetName, tmpOutputFile, columnNames); this.getDatabase().execute(exportCsvQuery.toString()); //Apply csv format transformations diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java index d34818a7..629cf00b 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/sequence/WriterSequence.java @@ -28,7 +28,8 @@ public void writeOutputFiles(Path inDirectory, VtlBindings vtlBindings, Map modeInputsMap, Map metadataModels, - List errors, + List errors, + KraftwerkExecutionLog kraftwerkExecutionLog, Statement database, FileUtilsInterface fileUtilsInterface) throws KraftwerkException { Path outDirectory = FileUtilsInterface.transformToOut(inDirectory,executionDateTime); From 900f39e686f9b7113a20bd3780cabd6b60ce1c86 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Thu, 11 Jul 2024 11:02:46 +0200 Subject: [PATCH 40/46] refacto try catch batch --- .../java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java | 5 +---- 1 file changed, 1 insertion(+), 4 deletions(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index 9f0fa579..19927942 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -81,12 +81,9 @@ public void run(String... args) { } }catch(Exception e){ log.error(e.toString()); - } - if(args.length > 0) { System.exit(1); - }else{ - log.info("Launching Kraftwerk in API mode..."); } + log.info("Launching Kraftwerk in API mode..."); } /** From 4b56be2d675a34abe995ad01cee77e45b127da87 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 12 Jul 2024 11:21:42 +0200 Subject: [PATCH 41/46] Added unit tests to increase coverage --- .../core/data/model/ExternalVariable.java | 3 + .../BuildBIndingsSequenceGenesisTest.java | 98 +++++++++++ .../kraftwerk/core/utils/SqlUtilsTest.java | 25 +++ .../utils/log/KraftwerkExecutionLogTest.java | 35 ++++ .../genesis/WEB/PARADATA/paradataTest.json | 159 ++++++++++++++++++ .../WEB/REPORTING_DATA/reportingdata.csv | 2 + .../WEB/REPORTING_DATA/reportingdata.xml | 155 +++++++++++++++++ 7 files changed, 477 insertions(+) create mode 100644 kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBIndingsSequenceGenesisTest.java create mode 100644 kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/log/KraftwerkExecutionLogTest.java create mode 100644 kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/PARADATA/paradataTest.json create mode 100644 kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.csv create mode 100644 kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.xml diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/data/model/ExternalVariable.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/data/model/ExternalVariable.java index 23f2b5cd..85f0afd9 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/data/model/ExternalVariable.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/data/model/ExternalVariable.java @@ -1,13 +1,16 @@ package fr.insee.kraftwerk.core.data.model; import lombok.Getter; +import lombok.Setter; import java.util.List; public class ExternalVariable { @Getter + @Setter private String idVar; @Getter + @Setter private List values; } diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBIndingsSequenceGenesisTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBIndingsSequenceGenesisTest.java new file mode 100644 index 00000000..5472f7c0 --- /dev/null +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/sequence/BuildBIndingsSequenceGenesisTest.java @@ -0,0 +1,98 @@ +package fr.insee.kraftwerk.core.sequence; + +import fr.insee.kraftwerk.core.Constants; +import fr.insee.kraftwerk.core.TestConstants; +import fr.insee.kraftwerk.core.data.model.ExternalVariable; +import fr.insee.kraftwerk.core.data.model.Mode; +import fr.insee.kraftwerk.core.data.model.SurveyUnitUpdateLatest; +import fr.insee.kraftwerk.core.data.model.VariableState; +import fr.insee.kraftwerk.core.metadata.Group; +import fr.insee.kraftwerk.core.metadata.MetadataModel; +import fr.insee.kraftwerk.core.metadata.Variable; +import fr.insee.kraftwerk.core.metadata.VariableType; +import fr.insee.kraftwerk.core.utils.files.FileSystemImpl; +import fr.insee.kraftwerk.core.vtl.VtlBindings; +import org.junit.jupiter.api.BeforeAll; +import org.junit.jupiter.api.Test; + +import java.nio.file.Path; +import java.util.ArrayList; +import java.util.HashMap; +import java.util.List; +import java.util.Map; + +import static org.junit.Assert.assertThrows; +import static org.junit.jupiter.api.Assertions.assertDoesNotThrow; + +class BuildBIndingsSequenceGenesisTest { + private static final List surveyUnits = new ArrayList<>(); + + @BeforeAll + static void init(){ + String dataMode = "WEB"; + //Create one document + surveyUnits.clear(); + SurveyUnitUpdateLatest surveyUnitUpdateLatest = new SurveyUnitUpdateLatest(); + surveyUnitUpdateLatest.setIdUE("0000001"); + surveyUnitUpdateLatest.setIdCampaign("TESTCAMPAIGN"); + surveyUnitUpdateLatest.setIdQuest("TESTQUEST"); + surveyUnitUpdateLatest.setMode(Mode.valueOf(dataMode)); + + surveyUnitUpdateLatest.setVariablesUpdate(new ArrayList<>()); + VariableState variableState = new VariableState(); + variableState.setIdVar("COLLVAR1"); + variableState.setIdLoop(Constants.ROOT_GROUP_NAME); + variableState.setValues(new ArrayList<>()); + variableState.getValues().add("TEST1"); + surveyUnitUpdateLatest.getVariablesUpdate().add(variableState); + variableState = new VariableState(); + variableState.setIdVar("COLLVAR2"); + variableState.setIdLoop("LOOP1"); + variableState.setIdParent(Constants.ROOT_GROUP_NAME); + variableState.setValues(new ArrayList<>()); + variableState.getValues().add("TEST3"); + surveyUnitUpdateLatest.getVariablesUpdate().add(variableState); + + surveyUnitUpdateLatest.setExternalVariables(new ArrayList<>()); + ExternalVariable externalVariable = new ExternalVariable(); + externalVariable.setIdVar("EXTVAR1"); + externalVariable.setValues(new ArrayList<>()); + externalVariable.getValues().add("TEST2"); + surveyUnitUpdateLatest.getExternalVariables().add(externalVariable); + + surveyUnits.add(surveyUnitUpdateLatest); + } + + @Test + void buildVtlBindings_errorWithoutMetadata(){ + //GIVEN + String dataMode = "WEB"; + + VtlBindings vtlBindings = new VtlBindings(); + BuildBindingsSequenceGenesis bbsg = new BuildBindingsSequenceGenesis(new FileSystemImpl()); + //WHEN + THEN + assertThrows(NullPointerException.class, () -> bbsg.buildVtlBindings(dataMode, vtlBindings, null, surveyUnits, null)); + + } + + @Test + void buildVtlBindings_success(){ + //GIVEN + String dataMode = "WEB"; + + VtlBindings vtlBindings = new VtlBindings(); + BuildBindingsSequenceGenesis bbsg = new BuildBindingsSequenceGenesis(new FileSystemImpl()); + MetadataModel metadata = new MetadataModel(); + metadata.getVariables().putVariable(new Variable("COLLVAR1", metadata.getRootGroup(), VariableType.STRING)); + Group group = new Group("TESTLOOP",Constants.ROOT_GROUP_NAME); + metadata.getVariables().putVariable(new Variable("COLLVAR2", group, VariableType.STRING)); + metadata.getVariables().putVariable(new Variable("EXTVAR1", metadata.getRootGroup(), VariableType.STRING)); + metadata.getGroups().put("TESTLOOP", group); + Map modeMetadataMap = new HashMap<>(); + modeMetadataMap.put(dataMode,metadata); + + //WHEN + THEN + assertDoesNotThrow(() -> bbsg.buildVtlBindings(dataMode, vtlBindings, modeMetadataMap, surveyUnits, + Path.of(TestConstants.UNIT_TESTS_DIRECTORY, "genesis"))); + } +} diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java index fc606c17..b5fdeec4 100644 --- a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/SqlUtilsTest.java @@ -15,6 +15,9 @@ import org.junit.jupiter.api.BeforeAll; import org.junit.jupiter.api.Test; +import java.io.IOException; +import java.nio.file.FileSystemException; +import java.nio.file.Files; import java.nio.file.Path; import java.sql.Connection; import java.sql.ResultSet; @@ -186,6 +189,28 @@ void getTableNamesTest() throws SQLException { } } + @Test + void openConnection_file_test() throws SQLException, IOException { + Path filePath = Path.of(TestConstants.UNIT_TESTS_DIRECTORY,"sql","testdb.duckdb"); + try(Connection testDatabaseFile = SqlUtils.openConnection(filePath)) { + Assertions.assertThat(testDatabaseFile).isNotNull(); + + Statement testDatabaseStatement = testDatabaseFile.createStatement(); + //Given + testDatabaseStatement.execute("CREATE TABLE testtable1(testint1 INT, teststring1 NVARCHAR)"); + testDatabaseStatement.execute("CREATE TABLE testtable2(testint2 INT, teststring2 NVARCHAR)"); + + //When + List tableNames = SqlUtils.getTableNames(testDatabaseStatement); + + //Then + Assertions.assertThat(tableNames).contains("testtable1","testtable2"); + testDatabaseStatement.close(); + } + Files.deleteIfExists(filePath); + Files.deleteIfExists(filePath.getParent().resolve(filePath.getFileName()+".wal")); + } + @AfterAll diff --git a/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/log/KraftwerkExecutionLogTest.java b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/log/KraftwerkExecutionLogTest.java new file mode 100644 index 00000000..ac181309 --- /dev/null +++ b/kraftwerk-core/src/test/java/fr/insee/kraftwerk/core/utils/log/KraftwerkExecutionLogTest.java @@ -0,0 +1,35 @@ +package fr.insee.kraftwerk.core.utils.log; + +import org.assertj.core.api.Assertions; +import org.junit.jupiter.api.Test; + +import java.text.SimpleDateFormat; +import java.time.LocalDateTime; +import java.time.ZoneOffset; +import java.util.ArrayList; +import java.util.HashMap; + +class KraftwerkExecutionLogTest { + @Test + void getFormattedString_test(){ + //GIVEN + KraftwerkExecutionLog kraftwerkExecutionLog = new KraftwerkExecutionLog(); + SimpleDateFormat simpleDateFormat = new SimpleDateFormat("dd/MM/yyyy HH:mm:ss.SSS"); + long start = LocalDateTime.now().toEpochSecond(ZoneOffset.UTC); + long stop = LocalDateTime.now().toEpochSecond(ZoneOffset.UTC); + + kraftwerkExecutionLog.setStartTimeStamp(start); + kraftwerkExecutionLog.setEndTimeStamp(stop); + kraftwerkExecutionLog.setOkFileNames(new ArrayList<>()); + kraftwerkExecutionLog.setLineCountByTableMap(new HashMap<>()); + + kraftwerkExecutionLog.getOkFileNames().add("TEST.xml"); + kraftwerkExecutionLog.getLineCountByTableMap().put("RACINE",1); + + //WHEN + String formattedString = kraftwerkExecutionLog.getFormattedString(); + + //THEN + Assertions.assertThat(formattedString).contains("TEST.xml", "RACINE", simpleDateFormat.format(start), simpleDateFormat.format(stop)); + } +} diff --git a/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/PARADATA/paradataTest.json b/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/PARADATA/paradataTest.json new file mode 100644 index 00000000..e18b95b2 --- /dev/null +++ b/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/PARADATA/paradataTest.json @@ -0,0 +1,159 @@ +{ + "idSu": "0000001", + "events": [ + [ + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "validationPage", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "validate-button-orchestrator-collect", + "timestamp": 1645807734894 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "validationPage", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "agree-sending-modal-button-orchestrator-collect", + "timestamp": 1645807741929 + } + ], + [ + { + "idSurveyUnit": "0000001", + "typeParadataObject": "session", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "session-started", + "idParadataObject": "init-session", + "timestamp": 1645807624027 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "orchestrator-create", + "idParadataObject": "init-orchestrator-collect", + "timestamp": 1645807624458 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "welcomePage", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "next-button-orchestrator-collect", + "timestamp": 1645807637176 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "1", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "next-button-orchestrator-collect", + "timestamp": 1645807674779 + } + ], + [ + { + "idSurveyUnit": "0000001", + "typeParadataObject": "lunatic-input", + "idOrchestrator": "orchestrator-collect", + "responseName": "CADR", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "1", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "selection", + "value": "3", + "idParadataObject": "radio-kb9hlpdc-3", + "timestamp": 1645807679901 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "2", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "next-button-orchestrator-collect", + "timestamp": 1645807684715 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "lunatic-input", + "idOrchestrator": "orchestrator-collect", + "responseName": "INDNVOCC", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "2", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "selection", + "value": "2", + "idParadataObject": "radio-kqweh61i-2", + "timestamp": 1645807690025 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "4", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "next-button-orchestrator-collect", + "timestamp": 1645807691450 + }, + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "184", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "next-button-orchestrator-collect", + "timestamp": 1645807730751 + } + ], + [ + { + "idSurveyUnit": "0000001", + "typeParadataObject": "orchestrator", + "idOrchestrator": "orchestrator-collect", + "idQuestionnaire": "TESTQUEST", + "userAgent": "Mozilla/5.0 (Windows NT 10.0; Win64; x64) AppleWebKit/537.36 (KHTML, like Gecko) Chrome/98.0.4758.102 Safari/537.36", + "page": "endPage", + "idSession": "593d88e6-3f11-49a2-9727-92a8e13fb39f", + "type": "click", + "idParadataObject": "logout-close-button-orchestrator-collect", + "timestamp": 1645807759129 + } + ] + ] +} \ No newline at end of file diff --git a/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.csv b/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.csv new file mode 100644 index 00000000..ffea39f6 --- /dev/null +++ b/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.csv @@ -0,0 +1,2 @@ +statut,dateInfo,idUe,idContact,nom,prenom,adresse,numeroDeLot +INITLA,14/02/2022 14:35:34,0000001,XXXXXXX,NAME,FirstName,13 rue du Général hulot Insee Grand Est 54042 - Nancy cedex,99 \ No newline at end of file diff --git a/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.xml b/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.xml new file mode 100644 index 00000000..af9cc6e8 --- /dev/null +++ b/kraftwerk-core/src/test/resources/unit_tests/genesis/WEB/REPORTING_DATA/reportingdata.xml @@ -0,0 +1,155 @@ + + + TESTCAMPAIGN + + + 1686292973000 + 1688884973000 + + + + + 0000001 + E9LC05 + OU-TEST1 + false + + M. TEST TESTMAN + + + 1 AVENUE DES TESTS + + 01000 TESTVILLE + + + + + false + false + + + 0 + 0 + 0 + 1 + 202 + 11 + 1 + 0 + 0 + + 0 + + + + Mister + TEST + TESTMAN + toto@titi.fr + true + false + 01/01/1970 + + + 06000000 + interviewer + true + + + + + + + NVM + 1686306249642 + + + ANV + 1686306426503 + + + VIN + 1686306436167 + + + FIN + 1686749244026 + + + VIC + 1686313807830 + + + PRC + 1686313812283 + + + INS + 1686314711901 + + + WFT + 1686315212517 + + + AOC + 1686315494389 + + + APS + 1686315494390 + + + WFT + 1686315494391 + + + INS + 1686315520098 + + + WFT + 1686315525950 + + + APS + 1686315539138 + + + WFT + 1686315539139 + + + WFS + 1686315551319 + + + TBR + 1686315557403 + + + + + INTERVIEWER + ras + + + MANAGEMENT + + + + + INA + 1686315536222 + 1 + + + + INA + TEL + 1686315468266 + + + + + From 2ac3b784aebfa72b1e6647bd385c6942886c95c2 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 12 Jul 2024 14:55:47 +0200 Subject: [PATCH 42/46] Update README.md --- README.md | 23 +++++++++++++++++++++++ 1 file changed, 23 insertions(+) diff --git a/README.md b/README.md index 4d2622b7..50b437fb 100644 --- a/README.md +++ b/README.md @@ -21,6 +21,18 @@ User documentation and functional tests are still in an [inhouse project](https: Kraftwerk uses [Lombok](https://projectlombok.org/). +## Launch + +If no argument is specified in the `java -jar` command, Kraftwerk will launch +as a REST API. +Otherwise, it will launch on batch mode and apply treatments on one campaign +with the specified arguments. +The required arguments for batch mode are as follows (in order) : +1. Service to use (`MAIN`,`FILEBYFILE`,`GENESIS`,`LUNATIC_ONLY`) +2. Archive at end of execution (`false` or `true`) +3. Integrate all reporting datas (`false` or `true`) +4. Campaign name + :fr: Kraftwerk est une application Java Spring conçue pour valider et traiter des données provenant d'enquêtes multimodes, afin de générer des tableaux de données prêts à être utilisés à des fins statistiques. @@ -37,3 +49,14 @@ La documentation utilisateur et les tests fonctionnels sont encore dans un [proj * Maven 3.6 + Kraftwerk utilise [Lombok](https://projectlombok.org/). + +## Lancement + +Si aucun paramètre n'est spécifié dans la commande `java -jar`, Kraftwerk se lancera +en tant qu'API REST. +Sinon, il va se lancer en mode batch et appliquer les traitements sur une campagne +avec les paramètres spécifiés. Les paramètres requis pour le mode batch sont les suivants (dans l'ordre) : +1. Service à utiliser (`MAIN`,`FILEBYFILE`,`GENESIS`,`LUNATIC_ONLY`) +2. Archiver à la fin de l'exécution (`false` ou `true`) +3. Integrate all reporting datas (`false` ou `true`) +4. Nom de la campagne \ No newline at end of file From 305845bde8f824af2adfc8c35597e19e7375faa9 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Fri, 12 Jul 2024 15:00:19 +0200 Subject: [PATCH 43/46] Update Dockerfile --- Dockerfile | 4 ++-- 1 file changed, 2 insertions(+), 2 deletions(-) diff --git a/Dockerfile b/Dockerfile index c084c8f5..673500f9 100644 --- a/Dockerfile +++ b/Dockerfile @@ -1,7 +1,7 @@ # Java 21 FROM gitlab-registry.insee.fr:443/kubernetes/images/run/jre:21.0.1_12-jre-jammy-rootless -ARG VERSION_KRAFTWERK -COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api-$VERSION_KRAFTWERK.jar kraftwerk.jar +ARG VERSION_APPLICATION +COPY --chown=$JAVA_USER:$JAVA_USER Kraftwerk/kraftwerk-api/target/kraftwerk-api-$VERSION_APPLICATION.jar kraftwerk.jar EXPOSE 8080 From da58c6ad4606bf4922a460f253622573bdf3e042 Mon Sep 17 00:00:00 2001 From: QDIBYS Date: Mon, 15 Jul 2024 08:23:07 +0200 Subject: [PATCH 44/46] Added args in comments --- .../java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java | 4 ++++ 1 file changed, 4 insertions(+) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java index 19927942..cd199d59 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/batch/KraftwerkBatch.java @@ -47,6 +47,10 @@ public void run(String... args) { checkArgs(args); //Parse arguments + //0. Service to use (MAIN,FILEBYFILE,GENESIS,LUNATIC_ONLY) + //1. Archive at end of execution (false or true) + //2. Integrate all reporting datas (false or true) + //3. Campaign name KraftwerkServiceType kraftwerkServiceType = KraftwerkServiceType.valueOf(args[0]); boolean archiveAtEnd = Boolean.parseBoolean(args[1]); boolean withAllReportingData = Boolean.parseBoolean(args[2]); From 57ad15992ce1030cae8c8b58b11feee336f2f05e Mon Sep 17 00:00:00 2001 From: Alice Lambois Date: Tue, 16 Jul 2024 15:03:40 +0200 Subject: [PATCH 45/46] Fix missing import --- .../insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java | 1 + 1 file changed, 1 insertion(+) diff --git a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java index 55c379ea..33640c30 100644 --- a/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java +++ b/kraftwerk-core/src/main/java/fr/insee/kraftwerk/core/outputs/parquet/ParquetOutputFiles.java @@ -16,6 +16,7 @@ import java.nio.file.Path; import java.sql.Statement; import java.util.ArrayList; +import java.util.HashMap; import java.util.List; import java.util.Map; import java.util.stream.Collectors; From 476beb41237c64c2bab06a2b537a121c8dd0a401 Mon Sep 17 00:00:00 2001 From: Alice Lambois Date: Tue, 16 Jul 2024 15:08:32 +0200 Subject: [PATCH 46/46] Update HealthcheckService.java --- .../fr/insee/kraftwerk/api/services/HealthcheckService.java | 3 ++- 1 file changed, 2 insertions(+), 1 deletion(-) diff --git a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/HealthcheckService.java b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/HealthcheckService.java index 3dc61a99..9ea54933 100644 --- a/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/HealthcheckService.java +++ b/kraftwerk-api/src/main/java/fr/insee/kraftwerk/api/services/HealthcheckService.java @@ -32,7 +32,8 @@ public class HealthcheckService extends KraftwerkService { @Autowired public HealthcheckService(ConfigProperties configProperties) { - this.configProperties = configProperties; + super(null); + this.configProperties = configProperties; this.client = new GenesisClient(new RestTemplateBuilder(), configProperties); }