@@ -168,7 +168,7 @@ def fetch(self, file_name, query):
        sparql.setReturnFormat(JSON)

        with open(file_name, 'w', encoding='utf-8') as f:
-            f.write('[')  # Début du tableau JSON
+            f.write('[')
            first_batch = True
            while True:
                try:
@@ -177,24 +177,22 @@ def fetch(self, file_name, query):
                    data = sparql.query().convert()

                    results = data['results']['bindings']
-                    if not results:  # Si aucun résultat, arrêter la boucle
+                    if not results:  # no more results: stop the loop
                        break

-                    # Ajouter les résultats au fichier
+                    # append the results to the file
                    for result in results:
                        if not first_batch:
-                            f.write(',')  # Ajouter une virgule entre les objets JSON
+                            f.write(',')
                        json.dump(result, f, ensure_ascii=False)
                        first_batch = False
-
                    offset += batch_size
-
                except Exception as e:
-                    print(f"Échec du chargement des données entre {offset} et {offset + batch_size} : {e}")
-                    break
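+                    # on failure, log the window that failed and skip it rather than aborting the whole fetch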
+                    print(f"Failed to load data from {offset} to {offset + batch_size}: {e}")
+                    offset += batch_size
            f.write(']')  # Fin du tableau JSON

-        print(f'Données écrites dans le fichier {file_name}.')
+        print(f'Data written to {file_name}.')
        with open(file_name, 'r', encoding='utf-8') as content_file:
            return json.loads(content_file.read())

@@ -414,67 +412,99 @@ def populate_fields(self, values, wikidata_id):
            'explanation': 'https://www.wikidata.org/wiki/Q' + format(wikidata_id),
        })
        return fields
+
+class Processor(object):
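+    """Drives a Wikidata synchronisation run for one entity type, recording
+    per-batch progress in Redis so that an interrupted run can be resumed."""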
+    client = OpenChurchClient()
+    q = Query()
+    redis_url = os.getenv('REDIS_URL')
+    redis_client = redis.from_url(redis_url)
+    verbosity_level = 0
+    type = 'diocese'
+    batch_size = 100
+
+    def process_batch(self, data, method, run_id):
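+        """Runs `method` on each batch of `data`, storing per-batch status, counters
+        and the current runId in Redis, and skipping batches already done in this run."""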
+        batches = Query.split_into_batches(data, self.batch_size)
+        self.redis_client.hset(self.type, "batchCount", len(batches))
+        iteration = 1
+        for batch in batches:
+            can_process = True
+            self.redis_client.hset(self.type, "currentBatch", iteration)
+            # one Redis hash per batch, keyed "<type>_<from>-<to>"
+            key_batch = get_redis_key(self.type, (iteration - 1) * self.batch_size, iteration * self.batch_size)
+            value_batch = self.redis_client.hgetall(key_batch)
+            if value_batch:
+                # a key exists: check whether this batch still needs processing
+                decoded_data = {key.decode('utf-8'): value.decode('utf-8') for key, value in value_batch.items()}
+                current_run_id = decoded_data.get('runId')
+                if current_run_id == str(run_id):
+                    can_process = False  # already processed during this run, skip it
+            if can_process:
+                self.redis_client.hset(key_batch, "status", "processing")
+                self.redis_client.hset(key_batch, "updatedAt", str(datetime.now()))
+                self.redis_client.hset(key_batch, "runId", run_id)
+                print("Processing batch %s/%s" % (iteration, len(batches)))
+                res = getattr(self.q, method)(batch, self.client)
+                if res:
+                    success_count = sum(1 for value in res.values() if value in {'Updated', 'Inserted'})
+                    self.redis_client.hset(key_batch, "successCount", success_count)
+                    self.redis_client.hset(key_batch, "failureCount", len(res) - success_count)
+                    self.redis_client.hset(key_batch, "status", "success")
+                else:
+                    self.redis_client.hset(key_batch, "status", "error")
+            else:
+                print("Ignore batch %s/%s" % (iteration, len(batches)))
+            iteration += 1
+
+    def process_entity(self):
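+        """Fetches the Wikidata dump for the configured entity type and pushes it batch
+        by batch, resuming the previous run if it is still marked as processing."""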
+        print("starting synchro for", self.type)
+        if self.type == "diocese":
+            data = self.q.fetch('wikidata_dioceses.json', dioceses_query)
+            method = "update_dioceses"
+        elif self.type == "parish":
+            data = self.q.fetch('wikidata_parishes.json', parishes_query)
+            method = "update_parishes"
+        elif self.type == "church":
+            data = self.q.fetch('wikidata_churches.json', churches_query)
+            method = "update_churches"
+        else:
+            raise ValueError("Unknown entity type %s" % self.type)
+
+        value_entity = self.redis_client.hgetall(self.type)
+        if value_entity:
+            decoded_data = {key.decode('utf-8'): value.decode('utf-8') for key, value in value_entity.items()}
+            run_id = decoded_data.get('runId')
+            if decoded_data.get('status') == 'processing':
+                # previous run did not finish: resume it under the same runId
+                self.process_batch(data, method, run_id)
+            else:
+                # previous run finished: start a new run with an incremented runId
+                self.clean_entity(int(run_id) + 1)
+                self.process_batch(data, method, int(run_id) + 1)
+        else:
+            # no previous state for this entity type: start run 1 from scratch
+            self.clean_entity(1)
+            self.process_batch(data, method, 1)
+
+        self.redis_client.hset(self.type, "status", "success")
+        self.redis_client.hset(self.type, "endDate", str(datetime.now()))
+        print("ended synchro for", self.type)
+
+    def clean_entity(self, run_id):
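+        """Resets the Redis hash for this entity type at the start of a new run."""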
+        self.redis_client.hset(self.type, "runId", run_id)
+        self.redis_client.hset(self.type, "startDate", str(datetime.now()))
+        self.redis_client.hset(self.type, "status", "processing")
+        self.redis_client.hset(self.type, "batchSize", self.batch_size)
+        self.redis_client.hdel(self.type, "endDate")

def percentage(num, total):
    return '%s = %s%%' % (num, (round(100 * num / total, 2)))

def get_redis_key(type, origin, to):
    return '%s_%s-%s' % (type, origin, to)

-def process_entity(type, batch_size, verbosity_level):
-    redis_url = os.getenv('REDIS_URL')
-    redis_client = redis.from_url(redis_url)
-    q = Query()
-    q.verbosity_level = verbosity_level
-    client = OpenChurchClient()
-
-    print("starting synchro for", type)
-    if type == "diocese":
-        data = q.fetch('wikidata_dioceses.json', dioceses_query)
-        method = "update_dioceses"
-    elif type == "parish":
-        data = q.fetch('wikidata_parishes.json', parishes_query)
-        method = "update_parishes"
-    elif type == "church":
-        data = q.fetch('wikidata_churches.json', churches_query)
-        method = "update_churches"
-    else:
-        raise ("Type d'entité non reconnu")
-
-    batches = Query.split_into_batches(data, batch_size)
-    iteration = 1
-    for batch in batches:
-        can_process = True
-        key = get_redis_key(type, iteration - 1, len(batch))
-        value = redis_client.hgetall(key)
-        if value:
-            # A key exist. We chek if we can process it
-            decoded_data = {key.decode('utf-8'): value.decode('utf-8') for key, value in value.items()}
-            if decoded_data.get('status') in {'success', 'error'}:
-                time_diff = datetime.now() - datetime.strptime(decoded_data.get('updatedAt'), "%Y-%m-%d %H:%M:%S.%f")
-                if time_diff <= timedelta(minutes=30):
-                    can_process = False  # We updated the batch less than 30 minutes ago. We skip it
-
-        if can_process:
-            redis_client.hset(key, "status", "processing")
-            redis_client.hset(key, "updatedAt", str(datetime.now()))
-            print("Processing batch %s/%s" % (iteration, len(batches) + 1))
-            res = getattr(q, method)(batch, client)
-            if res:
-                success_count = sum(1 for value in res.values() if value in {'Updated', 'Inserted'})
-                redis_client.hset(key, "successCount", success_count)
-                redis_client.hset(key, "failureCount", len(res) - success_count)
-                redis_client.hset(key, "status", "success")
-            else:
-                redis_client.hset(key, "status", "error")
-        else:
-            print("Ignore batch %s/%s" % (iteration, len(batches) + 1))
-        iteration += 1
-    print("ended synchro for", type)
-
if __name__ == '__main__':
    parser = argparse.ArgumentParser()
    parser.add_argument("--entity-only", type=str, required=True, choices=["parish", "diocese", "church"], help="Spécifiez l'entité à traiter : 'diocese', 'parish' ou 'church'")
    parser.add_argument("-v", "--verbose", action="count", default=0, help="Augmente le niveau de verbosité (utilisez -vvv pour plus de détails).")
    args = parser.parse_args()
-    process_entity(args.entity_only, 100, args.verbose)
+
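+    # build a Processor from the CLI arguments and launch the synchronisation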
+    processor = Processor()
+    processor.verbosity_level = args.verbose
+    processor.type = args.entity_only
+    processor.process_entity()