Merge branch 'release/v0.6.4' into master

Jérôme BUISINE, 3 years ago
Parent commit: 6561a67ebd

+ 7 - 0
back.Dockerfile

@@ -8,6 +8,11 @@ WORKDIR /usr/src/app
 # Server port
 EXPOSE 5000
 
+# Install python
+RUN apk add --update --no-cache gcc gfortran python python-dev py-pip build-base wget freetype-dev libpng-dev openblas-dev
+RUN pip install pymongo
+RUN pip install numpy
+
 # Install dependencies and generate documentation
 RUN yarn install && yarn doc
 
@@ -17,6 +22,8 @@ CMD if [ "$SERVE_CLIENT" == "true" ] ; \
     ([ -f ./experimentConfig.js ] && \
       echo "Experiment configuration found" \
       || (echo "Experiment configuration not found, copying default" && cp experimentConfig.default.js experimentConfig.js)) && \
+    ([ -d ./results ] || mkdir results) && \
+    ([ -f ./results/match_extracts_probs.json ] || echo "[]" >> results/match_extracts_probs.json) && \
     NODE_ENV=test yarn test && \
     yarn run app:build && \
     yarn run server:start ; \
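The two new guards in the CMD chain make the container self-seeding: `results/` is created if missing, and `match_extracts_probs.json` is initialized with an empty JSON array so the first read of it parses cleanly. A minimal Python sketch of the same guard logic (illustrative only, not part of the commit):

```python
# Mirror of the shell guards above: create results/ and seed the stats file
# with an empty JSON array so json.load() succeeds on a fresh container.
import json
import os

path = 'results/match_extracts_probs.json'
os.makedirs('results', exist_ok=True)

if not os.path.exists(path):
    with open(path, 'w') as f:
        f.write('[]')

with open(path) as f:
    data = json.load(f)

print(type(data), len(data))  # <class 'list'> 0
```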

+ 1 - 0
docker-compose.yml

@@ -34,6 +34,7 @@ services:
             - mongo
         volumes:
             - "${IMAGES_PATH:-./images}:/usr/src/app/images"
+            - "./results:/usr/src/app/results"
             - "./logs:/usr/src/app/logs"
         depends_on:
             - mongo

+ 10 - 1
expeStats.js

@@ -2,12 +2,19 @@
 
 // import { experiments } from './experimentConfig'
 const config = require('./experimentConfig')
-
+const mongoose = require('mongoose')
+const configApp = require('./config')
+const mongoDatabaseURI = configApp.mongoDatabaseURI
 const fs = require('fs-extra')
 
 const winston = require('winston')
 const execSync = require('child_process').execSync
 
+// const connectDb = async () => {
+//   await mongoose.connect(mongoDatabaseURI, { useNewUrlParser: true, useFindAndModify: false })
+//   mongoose.connection.on('error', (err) => console.log(err))
+// }
+
 // get whitelist scene for MatchExtractsWithReference experiment
 const scenes = config.experiments.MatchExtractsWithReference.availableScenes.whitelist
 
@@ -28,6 +35,8 @@ const fileLogger = winston.createLogger({
 })
 
 const setup = async (logToFile = false) => {
+  // await connectDb()
+
   if (logToFile) fileLogger.info({ log: 'Start extraction of data from mongo for `MatchExtractsExperiments`.', date: new Date() })
 
   execSync('python utils/extract_experiment.py', { encoding: 'utf-8' })

+ 14 - 15
experimentConfig.default.js

@@ -55,40 +55,39 @@ export const experiments = {
     availableScenes: {
       whitelist: [
         'p3d_arcsphere-view0_part6',
-        'p3d_bunny-fur-view0_part6',
         'p3d_car2-view0_part6',
         'p3d_caustic-view0_part6',
-        'p3d_chopper-titan-view0_part6',
-        'p3d_coffee-splash-view0_part6',
-        'p3d_cornel-box-view0_part6',
         'p3d_crown-view0_part6',
         'p3d_dragon-view0_part6',
         'p3d_dragon_250-view0_part6',
-        'p3d_ecosys-view0_part6',
-        'p3d_eponge-fractal-5-view0_part6',
-        'p3d_eponge-fractal-5-view1_part6',
-        'p3d_eponge-fractal-6-view0_part6',
         'p3d_eponge-fractal-6-view1_part6',
         'p3d_ganesha-view0_part6',
         'p3d_glass-of-water-view0_part6',
         'p3d_indirect-view0_part6',
-        'p3d_kitchen-view0_part6',
         'p3d_landscape-view3_part6',
-        'p3d_living-room-view0_part6',
-        'p3d_living-room-view1_part6',
-        'p3d_living-room-view2_part6',
-        'p3d_low_table_upper_view0_part6',
         'p3d_pavilion-day-view0_part6',
         'p3d_pavilion-day-view1_part6',
         'p3d_pavilion-day-view2_part6',
         'p3d_pavilion-night-view0_part6',
         'p3d_pavilion-night-view1_part6',
         'p3d_pavilion-night-view2_part6',
-        'p3d_sportscar-view0_part6',
         'p3d_staircase-view1_part6',
         'p3d_staircase2-view0_part6',
         'p3d_tt-view0_part6',
-        'p3d_vw-van-view0_part6'
+        'p3d_vw-van-view0_part6',
+        'p3d_low_table_2spheric_view0_part6',
+        'p3d_bathroom-view0_part6',
+        'p3d_classroom-view0_part6',
+        'p3d_classroom-view1_part6',
+        'p3d_contemporary-bathroom-view0_part6',
+        'p3d_contemporary-bathroom-view1_part6',
+        'p3d_glass-view0_part6',
+        'p3d_kitchen-view0_part6',
+        'p3d_kitchen-view1_part6',
+        'p3d_living-room-3-view0_part6',
+        'p3d_living-room-3-view1_part6',
+        'p3d_sanmiguel-view1_part6',
+        'p3d_sanmiguel-view2_part6'
       ],
       blacklist: null
       // No whitelist = Select all scenes

+ 1 - 1
utils/extract_experiment.py

@@ -2,7 +2,7 @@
 from pymongo import MongoClient
 import json, os
 
-connection = MongoClient()
+connection = MongoClient('mongodb://mongo:27017')
 
 db = connection['sin3d']
 data_collection = db['datas']
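Pointing `MongoClient` at `mongodb://mongo:27017` binds the script to the docker-compose service name. Should running it outside the compose network ever be needed, an environment-variable override is a common pattern; a sketch, assuming a hypothetical `MONGO_URI` variable the project does not currently define:

```python
# Sketch: fall back to the compose service name, but allow an override so the
# script also works against a local MongoDB instance.
import os
from pymongo import MongoClient

uri = os.environ.get('MONGO_URI', 'mongodb://mongo:27017')
connection = MongoClient(uri)

db = connection['sin3d']
data_collection = db['datas']
```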

+ 8 - 1
utils/extract_stats_freq_and_min.py

@@ -41,13 +41,20 @@ def main():
             
     
     output_file = open(p_output, 'w')
+    #output_file.write('scene;n_users;min_scene;\n')
 
     for scene in dict_data:
         output_file.write(scene + ';')
         
+        all_thresholds = []
+        n_users = 0
         for extract in dict_data[scene]:
             thresholds_data = dict_data[scene][extract]
-            output_file.write(str(int(np.min(thresholds_data))) + ';')
+            
+            all_thresholds.append(int(np.min(thresholds_data)))
+            n_users = len(thresholds_data)
+
+        output_file.write(str(n_users) + ';' + str(np.min(all_thresholds)) + ';')
 
         output_file.write('\n')
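Each output line now carries the user count before the scene minimum, i.e. `scene;n_users;min;` (matching the commented-out header). The `get_specific_dataset*.py` scripts below read it back with the same `split(';')` convention; a minimal reader sketch (the filename is illustrative):

```python
# Sketch: parse the scene;n_users;min; lines emitted by this script.
rows = []
with open('stats_freq_and_min.csv') as f:   # illustrative filename
    for line in f:
        fields = line.split(';')
        scene, n_users, min_threshold = fields[0], int(fields[1]), int(fields[2])
        rows.append((scene, n_users, min_threshold))

print(rows)
```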
 

+ 68 - 0
utils/extract_stats_freq_mean_std.py

@@ -0,0 +1,68 @@
+# main imports
+import os, sys
+import argparse
+import json
+import numpy as np
+
+
+def main():
+    """
+    main function which is run when launching the script
+    """ 
+    parser = argparse.ArgumentParser(description="Extract scenes data and save thresholds into .csv")
+
+    parser.add_argument('--file', type=str, help='json file with extracted experiment data', required=True)
+    parser.add_argument('--output', type=str, help='output csv filename', required=True)
+    parser.add_argument('--freq', type=int, help='write user frequency instead of thresholds', choices=[0, 1], required=True)
+
+    args = parser.parse_args()
+
+    p_file   = args.file
+    p_output = args.output
+    p_freq = bool(args.freq)
+
+    f = open(p_file)
+    json_data = json.load(f)
+
+    dict_data = {}
+
+    for element in json_data:
+
+        scene = element['msg']['sceneName']
+
+        if scene not in dict_data:
+            dict_data[scene] = {}
+
+        extracts = element['msg']['extracts']
+
+        for extract in extracts:
+            if extract['index'] not in dict_data[scene]:
+                dict_data[scene][extract['index']] = [extract['quality']]
+            else:
+                dict_data[scene][extract['index']].append(extract['quality'])
+            
+    
+    output_file = open(p_output, 'w')
+    #output_file.write('scene;n_users;min_scene;\n')
+
+    for scene in dict_data:
+        output_file.write(scene)
+        
+        all_thresholds = []
+        n_users = 0
+        for extract in dict_data[scene]:
+            thresholds_data = dict_data[scene][extract]
+            
+            all_thresholds.append(int(np.mean(thresholds_data) + np.std(thresholds_data)))
+            n_users = len(thresholds_data)
+
+        if p_freq:
+            output_file.write(';' + str(n_users))
+        else:
+            for t in all_thresholds:
+                output_file.write(';' + str(t))
+
+        output_file.write(';\n')
+
+if __name__ == "__main__":
+    main()
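The per-extract statistic in this new variant is the mean of the user-chosen qualities plus one standard deviation, truncated to `int`. A worked example with made-up values:

```python
# Worked example of int(mean + std) as used above; values are illustrative.
import numpy as np

thresholds_data = [120, 180, 200, 260]   # qualities chosen by users for one extract
t = int(np.mean(thresholds_data) + np.std(thresholds_data))
print(t)  # mean 190.0 + std 50.0 -> 240
```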

+ 222 - 0
utils/get_specific_dataset.py

@@ -0,0 +1,222 @@
+# main imports
+import os, sys
+import argparse
+import json
+import numpy as np
+import shutil
+
+# Rawls images
+from rawls.rawls import Rawls
+
+# others import
+from ipfml import utils
+from scipy.signal import savgol_filter
+
+'''
+Display progress information as progress bar
+'''
+def write_progress(progress):
+    barWidth = 180
+
+    output_str = "["
+    pos = barWidth * progress
+    for i in range(barWidth):
+        if i < pos:
+           output_str = output_str + "="
+        elif i == pos:
+           output_str = output_str + ">"
+        else:
+            output_str = output_str + " "
+
+    output_str = output_str + "] " + str(int(progress * 100.0)) + " %\r"
+    print(output_str)
+    sys.stdout.write("\033[F")
+
+
+def extract_index(filepath):
+
+    return int(filepath.split('-')[-1].split('.')[0])
+
+
+def extracts_linear_indices_rawls(images_path, n_expected=50, i_indices_step=20, o_indices_step=20, start_at=20, smooth_arr=False, gamma=False):
+
+    default_add = start_at - 20
+
+    # by default
+    if i_indices_step == 1:
+        default_add = 0
+
+    n_start_images = int(start_at / i_indices_step)
+    n_counter = 0
+    
+    # extract variance for each image path
+    var_arr = []
+    prev_rawls = None
+
+    n_images = len(images_path)
+
+    for p in sorted(images_path):
+        
+        if prev_rawls is None:
+            temp = Rawls.load(p)
+            
+            if gamma:
+                temp.gammaConvert()
+                
+            prev_rawls = temp
+        else:
+            temp = Rawls.load(p)
+            
+            if gamma:
+                temp.gammaConvert()
+                
+            prev_rawls = Rawls.fusion(prev_rawls, temp)
+        
+        write_progress((n_counter + 1) / n_images)
+
+        n_counter += 1
+        
+        if n_counter >= n_start_images:
+            # only get variance of the image center (800 x 800)
+            width, height, _ = prev_rawls.shape
+            n_w, n_h = (800, 800) # new expected size
+
+            # get center of image
+            middle_w = int(width / 2)
+            middle_h = int(height / 2)
+
+            # start coordinates
+            s_w = middle_w - int(n_w / 2)
+            s_h = middle_h - int(n_h / 2)
+
+            # end coordinates
+            e_w = middle_w + int(n_w / 2)
+            e_h = middle_h + int(n_h / 2)
+
+            var_arr.append(np.var(prev_rawls.data[s_w:e_w, s_h:e_h]))
+        
+    # normalize variance values
+    norm_arr = np.array(utils.normalize_arr_with_range(var_arr))
+    
+    if smooth_arr:
+        norm_arr = utils.normalize_arr_with_range(savgol_filter(norm_arr, 201, 3)) # window size 201, polynomial order 3
+    
+    # get expected linear step (using n_expected output images)
+    linear_steps = utils.normalize_arr_with_range((1 - (np.arange(n_expected) / n_expected)))
+    
+    # get image indices from variance convergence and linear
+    # => when linear step is reached we store the index found from variance values
+    
+    indices_found = []
+    for i in linear_steps: 
+        find_index = len(linear_steps) - 1
+        for index, y in enumerate(norm_arr):
+            if i <= y:
+                find_index = index
+        indices_found.append(find_index + 1)
+
+    indices = np.array(indices_found) * i_indices_step
+    
+    # trick to avoid duplicate indices
+    # => when an index equals the previous one, advance it by one output step
+    # Example with step of 20 : [20, 20, 20, 100, 200] => [20, 40, 60, 100, 200]
+    final_indices = []
+    for index, i in enumerate(indices):
+        value = indices[index]
+        if index > 0:
+            if i <= indices[index - 1]:
+                
+                value = indices[index - 1] + o_indices_step
+                indices[index] = value
+
+        final_indices.append(value)
+
+    return np.array(final_indices) + default_add
+
+
+def main():
+    """
+    main function which is run when launching the script
+    """ 
+    parser = argparse.ArgumentParser(description="Compute new dataset scene")
+
+    parser.add_argument('--file', type=str, help='file data extracted from `utils/extract_stats_freq_and_min.py` script', required=True)
+    parser.add_argument('--rawls_folder', type=str, help='rawls dataset folder with scene', required=True)
+    parser.add_argument('--png_folder', type=str, help='png dataset folder with scene', required=True)
+    parser.add_argument('--users', type=int, help='min number of users required per scene', required=True, default=10)
+    parser.add_argument('--samples', type=int, help='expected samples to get for this dataset', required=True, default=10000)
+    parser.add_argument('--output', type=str, help='output images folder', required=True)
+
+    args = parser.parse_args()
+
+    p_file   = args.file
+    p_rawls_folder = args.rawls_folder
+    p_png_folder = args.png_folder
+    p_users  = args.users
+    p_samples = args.samples
+    p_output = args.output
+
+    with open(p_file, 'r') as f:
+
+        for line in f.readlines():
+
+            data = line.split(';')
+
+            scene = data[0]
+            n_users = int(data[1])
+            min_index = int(data[2])
+
+            # remove _partX from scene name (keep everything before the last `_`)
+            scene_name = '_'.join(scene.split('_')[:-1])
+
+            if n_users >= p_users:
+                print('Extract custom indices based on minimum index for', scene)
+
+                rawls_folder_scene = os.path.join(p_rawls_folder, scene_name)
+                png_folder_scene = os.path.join(p_png_folder, scene)
+
+                if not os.path.exists(rawls_folder_scene):
+                    print(rawls_folder_scene, 'rawls folder does not exist')
+                else:
+                    
+                    # get all rawls files
+                    rawls_files = [ os.path.join(rawls_folder_scene, p) for p in sorted(os.listdir(rawls_folder_scene)) ]
+
+                    # extract step from these files
+                    input_step = p_samples / len(rawls_files)
+
+                    print('Extract indices for', scene)
+
+                    # get indices using min index
+                    indices = extracts_linear_indices_rawls(rawls_files, n_expected=50, i_indices_step=input_step, o_indices_step=20, start_at=min_index, smooth_arr=True, gamma=True)
+
+                    print('Indices found are', indices)
+                    # create output directory
+                    output_scene_dir = os.path.join(p_output, scene)
+
+                    if not os.path.exists(output_scene_dir):
+                        os.makedirs(output_scene_dir)
+
+                    # get expected png image and move it
+                    for index in indices:
+
+                        str_index = str(index)
+
+                        while len(str_index) < 5:
+                            str_index = "0" + str_index
+
+                        image_name = scene + '_' + str_index + '.png'
+                        png_image_path = os.path.join(png_folder_scene, image_name)
+
+                        # create output filepath
+                        output_img_filepath = os.path.join(output_scene_dir, image_name)
+
+                        # copy expected image path
+                        shutil.copy2(png_image_path, output_img_filepath)
+            else:
+                print('Only', n_users, 'users passed the experiment for', scene)
+    
+
+
+if __name__ == "__main__":
+    main()
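The heart of `extracts_linear_indices_rawls` maps a descending linear ramp onto the normalized variance curve: for each ramp level, it keeps the last image position whose variance still sits above that level, which spaces the selected images by variance convergence rather than uniformly in sample count. A toy sketch of that inner loop, with made-up arrays:

```python
# Toy sketch of the ramp-to-curve mapping above; arrays are illustrative.
import numpy as np

norm_arr = np.array([1.0, 0.8, 0.55, 0.3, 0.12, 0.0])  # normalized variance curve
linear_steps = 1 - np.arange(3) / 3                     # [1.0, 0.667, 0.333]

indices_found = []
for level in linear_steps:
    find_index = len(linear_steps) - 1
    for index, y in enumerate(norm_arr):
        if level <= y:
            find_index = index          # last point still above the level
    indices_found.append(find_index + 1)

print(indices_found)  # [1, 2, 3]
```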

+ 192 - 0
utils/get_specific_dataset_png.py

@@ -0,0 +1,192 @@
+# main imports
+import os, sys
+import argparse
+import json
+import numpy as np
+import shutil
+
+# PNG images
+from PIL import Image
+
+# others import
+from ipfml import utils
+from scipy.signal import savgol_filter
+
+'''
+Display progress information as progress bar
+'''
+def write_progress(progress):
+    barWidth = 180
+
+    output_str = "["
+    pos = barWidth * progress
+    for i in range(barWidth):
+        if i < pos:
+           output_str = output_str + "="
+        elif i == pos:
+           output_str = output_str + ">"
+        else:
+            output_str = output_str + " "
+
+    output_str = output_str + "] " + str(int(progress * 100.0)) + " %\r"
+    print(output_str)
+    sys.stdout.write("\033[F")
+
+
+def extract_index(filepath):
+
+    return int(filepath.split('_')[-1].split('.')[0])
+
+
+def extracts_linear_indices(images_path, n_expected=50, indices_step=20, start_at=20, smooth_arr=False):
+
+    # TODO : check this part
+    default_add = start_at - indices_step
+    
+    # extract variance for each image path
+    var_arr = []
+
+    n_counter = 0
+    n_images = len(images_path)
+
+    for p in sorted(images_path):
+        img = Image.open(p)
+        var_arr.append(np.var(img))
+
+        n_counter += 1
+        write_progress((n_counter + 1) / n_images)
+        
+    # normalize variance values
+    norm_arr = np.array(utils.normalize_arr_with_range(var_arr))
+    
+    if smooth_arr:
+        norm_arr = utils.normalize_arr_with_range(savgol_filter(norm_arr, 201, 3)) # window size 201, polynomial order 3
+    
+    # get expected linear step (using n_expected output images)
+    linear_steps = utils.normalize_arr_with_range((1 - (np.arange(n_expected) / n_expected)))
+    
+    # get image indices from variance convergence and linear
+    # => when linear step is reached we store the index found from variance values
+    indices_found = []
+    for i in linear_steps: 
+        
+        find_index = 0
+        
+        for index, y in enumerate(norm_arr):
+            if i <= y:
+                find_index = index
+
+        indices_found.append(find_index + 1)
+
+    indices = np.array(indices_found) * indices_step
+    
+    # trick to avoid duplicate indices
+    # => when an index equals the previous one, advance it by one step
+    # Example with step of 20 : [20, 20, 20, 100, 200] => [20, 40, 60, 100, 200]
+    final_indices = []
+    for index, i in enumerate(indices):
+        value = indices[index]
+        if index > 0:
+            if i <= indices[index - 1]:
+                value = indices[index - 1] + indices_step
+                indices[index] = value
+
+        final_indices.append(value)
+        
+    return np.array(final_indices) + default_add
+
+
+def main():
+    """
+    main function which is run when launching the script
+    """ 
+    parser = argparse.ArgumentParser(description="Compute new dataset scene")
+
+    parser.add_argument('--file', type=str, help='file data extracted from `utils/extract_stats_freq_and_min.py` script', required=True)
+    parser.add_argument('--png_folder', type=str, help='png dataset folder with scene', required=True)
+    parser.add_argument('--users', type=int, help='min number of users required per scene', required=True, default=10)
+    #parser.add_argument('--samples', type=int, help='expected samples to get for this dataset', required=True, default=10000)
+    parser.add_argument('--output', type=str, help='output image folder', required=True)
+
+    args = parser.parse_args()
+
+    p_file   = args.file
+    p_png_folder = args.png_folder
+    p_users  = args.users
+    #p_samples = args.samples
+    p_output = args.output
+
+    with open(p_file, 'r') as f:
+
+        for line in f.readlines():
+
+            data = line.split(';')
+
+            scene = data[0]
+            n_users = int(data[1])
+            min_index = int(data[2])
+
+            # remove _partX from scene name
+            scene_parts = scene.split('_')
+            del scene_parts[-1]
+            scene_name = '_'.join(scene_parts)
+
+            output_scene_dir = os.path.join(p_output, scene)
+
+            if os.path.exists(output_scene_dir):
+                print('Extraction of custom indices already done for', scene)
+                continue
+
+            if n_users >= p_users:
+                print('Extract custom indices based on minimum index for', scene)
+
+                png_folder_scene = os.path.join(p_png_folder, scene)
+
+                if not os.path.exists(png_folder_scene):
+                    print(png_folder_scene, 'png folder does not exist')
+                else:
+                    
+                    # get all png files
+                    png_files = [ os.path.join(png_folder_scene, p) for p in sorted(os.listdir(png_folder_scene)) ]
+
+                    # extract max samples found for this scene
+                    _, filename = os.path.split(png_files[-1])
+
+                    max_samples = extract_index(filename)
+
+                    # extract step from these files
+                    input_step = int(max_samples / len(png_files))
+
+                    # get indices using min index
+                    indices = extracts_linear_indices(png_files[int(min_index / input_step):], n_expected=50, indices_step=input_step, start_at=min_index, smooth_arr=True)
+
+                    # print('Indices found are', indices)
+                    # create output directory
+                    if not os.path.exists(output_scene_dir):
+                        os.makedirs(output_scene_dir)
+
+                    # get expected png image and move it
+                    for index in indices:
+                        
+                        str_index = str(index)
+
+                        while len(str_index) < 5:
+                            str_index = "0" + str_index
+
+                        image_name = scene_name + '_' + str_index + '.png'
+                        png_image_path = os.path.join(png_folder_scene, image_name)
+
+                        # create output filepath
+                        output_img_filepath = os.path.join(output_scene_dir, image_name)
+
+                        # copy expected image path
+                        shutil.copy2(png_image_path, output_img_filepath)
+            else:
+                print('Only', n_users, 'users passed the experiment for', scene)
+            
+            print('\n---------------------------------------------')
+    
+
+
+if __name__ == "__main__":
+    main()
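This PNG variant shares the duplicate-index trick with the rawls script: when the variance curve plateaus, several ramp levels resolve to the same image, and each repeat is pushed one step past its predecessor. Isolated as a toy sketch:

```python
# Toy sketch of the duplicate-index fix-up above:
# [20, 20, 20, 100, 200] -> [20, 40, 60, 100, 200]
import numpy as np

indices = np.array([20, 20, 20, 100, 200])
indices_step = 20

final_indices = []
for index, i in enumerate(indices):
    value = indices[index]
    if index > 0 and i <= indices[index - 1]:
        value = indices[index - 1] + indices_step   # advance past the previous index
        indices[index] = value
    final_indices.append(int(value))

print(final_indices)  # [20, 40, 60, 100, 200]
```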

+ 210 - 0
utils/get_specific_dataset_png_with_mean.py

@@ -0,0 +1,210 @@
+# main imports
+import os, sys
+import argparse
+import json
+import numpy as np
+import shutil
+
+# PNG images
+from PIL import Image
+
+# others import
+from ipfml import utils
+from scipy.signal import savgol_filter
+
+'''
+Display progress information as progress bar
+'''
+def write_progress(progress):
+    barWidth = 180
+
+    output_str = "["
+    pos = barWidth * progress
+    for i in range(barWidth):
+        if i < pos:
+           output_str = output_str + "="
+        elif i == pos:
+           output_str = output_str + ">"
+        else:
+            output_str = output_str + " "
+
+    output_str = output_str + "] " + str(int(progress * 100.0)) + " %\r"
+    print(output_str)
+    sys.stdout.write("\033[F")
+
+
+def extract_index(filepath):
+
+    return int(filepath.split('_')[-1].split('.')[0])
+
+
+def extracts_linear_indices(images_path, n_expected=50, indices_step=20, start_at=20, smooth_arr=False):
+
+    # TODO : check this part
+    default_add = start_at - indices_step
+    
+    # extract variance for each image path
+    var_arr = []
+
+    n_counter = 0
+    n_images = len(images_path)
+
+    for p in sorted(images_path):
+        img = Image.open(p)
+        var_arr.append(np.var(img))
+
+        n_counter += 1
+        write_progress((n_counter + 1) / n_images)
+        
+    # normalize variance values
+    norm_arr = np.array(utils.normalize_arr_with_range(var_arr))
+    
+    if smooth_arr:
+        norm_arr = utils.normalize_arr_with_range(savgol_filter(norm_arr, 201, 3)) # window size 201, polynomial order 3
+    
+    # get expected linear step (using n_expected output images)
+    linear_steps = utils.normalize_arr_with_range((1 - (np.arange(n_expected) / n_expected)))
+    
+    # get image indices from variance convergence and linear
+    # => when linear step is reached we store the index found from variance values
+    indices_found = []
+    for i in linear_steps: 
+        
+        find_index = 0
+        
+        for index, y in enumerate(norm_arr):
+            if i <= y:
+                find_index = index
+
+        indices_found.append(find_index + 1)
+
+    indices = np.array(indices_found) * indices_step
+    
+    # trick to avoid duplicate indices
+    # => when an index equals the previous one, advance it by one step
+    # Example with step of 20 : [20, 20, 20, 100, 200] => [20, 40, 60, 100, 200]
+    final_indices = []
+    for index, i in enumerate(indices):
+        value = indices[index]
+        if index > 0:
+            if i <= indices[index - 1]:
+                value = indices[index - 1] + indices_step
+                indices[index] = value
+
+        final_indices.append(value)
+        
+    return np.array(final_indices) + default_add
+
+
+def main():
+    """
+    main function which is run when launching the script
+    """ 
+    parser = argparse.ArgumentParser(description="Compute new dataset scene")
+
+    parser.add_argument('--file', type=str, help='file data extracted from `utils/extract_stats_freq_and_min.py` script', required=True)
+    parser.add_argument('--png_folder', type=str, help='png dataset folder with scene', required=True)
+    parser.add_argument('--users', type=int, help='min number of users required per scene', required=True, default=10)
+    #parser.add_argument('--samples', type=int, help='expected samples to get for this dataset', required=True, default=10000)
+    parser.add_argument('--output', type=str, help='output image folder', required=True)
+
+    args = parser.parse_args()
+
+    p_file   = args.file
+    p_png_folder = args.png_folder
+    p_users  = args.users
+    #p_samples = args.samples
+    p_output = args.output
+
+    with open(p_file, 'r') as f:
+
+        for line in f.readlines():
+
+            data = line.split(';')
+
+            scene = data[0]
+            n_users = int(data[1])
+            min_index = int(data[2])
+
+            # remove _partX from scene name
+            scene_parts = scene.split('_')
+            del scene_parts[-1]
+            scene_name = '_'.join(scene_parts)
+
+            output_scene_dir = os.path.join(p_output, scene)
+
+            if os.path.exists(output_scene_dir):
+                print('Extraction of custom indices already done for', scene)
+                continue
+
+            if n_users >= p_users:
+                print('Extract custom indices based on minimum index for', scene)
+
+                png_folder_scene = os.path.join(p_png_folder, scene)
+
+                if not os.path.exists(png_folder_scene):
+                    print(png_folder_scene, 'png folder does not exist')
+                else:
+                    
+                    # get all png files
+                    png_files = [ os.path.join(png_folder_scene, p) for p in sorted(os.listdir(png_folder_scene)) ]
+
+                    # extract max samples found for this scene
+                    _, filename = os.path.split(png_files[-1])
+
+                    max_samples = extract_index(filename)
+
+                    # extract step from these files
+                    input_step = int(max_samples / len(png_files))
+
+                    # get indices using min index
+                    indices = extracts_linear_indices(png_files[int(min_index / input_step):], n_expected=50, indices_step=input_step, start_at=min_index, smooth_arr=True)
+                    
+                    # here add the most noisy image + mean between first predicted and most noisy image
+                    min_index = extract_index(png_files[0])
+
+                    if min_index not in indices:
+
+                        # get mean between the min index and the second selected index
+                        mean_index = int((min_index + indices[1]) / 2)
+
+                        # check mean index step
+                        if mean_index % input_step != 0:
+                            mean_index = mean_index + (mean_index % input_step)
+
+                        if mean_index not in indices:
+                            indices = np.insert(indices, 0, mean_index)
+                        
+                        # add min index as first
+                        indices = np.insert(indices, 0, min_index)
+
+                    # print('Indices found are', indices)
+                    # create output directory
+                    if not os.path.exists(output_scene_dir):
+                        os.makedirs(output_scene_dir)
+
+                    # get expected png image and move it
+                    for index in indices:
+                        
+                        str_index = str(index)
+
+                        while len(str_index) < 5:
+                            str_index = "0" + str_index
+
+                        image_name = scene_name + '_' + str_index + '.png'
+                        png_image_path = os.path.join(png_folder_scene, image_name)
+
+                        # create output filepath
+                        output_img_filepath = os.path.join(output_scene_dir, image_name)
+
+                        # copy expected image path
+                        shutil.copy2(png_image_path, output_img_filepath)
+            else:
+                print('Only', n_users, 'users passed the experiment for', scene)
+            
+            print('\n---------------------------------------------')
+    
+
+
+if __name__ == "__main__":
+    main()
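The `*_with_mean` variant adds one post-processing step: if the noisiest available image is not already selected, it is prepended, together with a midpoint between it and the second selected index (as the code above computes it), nudged onto the sampling-step grid. A toy sketch of that insertion, with illustrative values:

```python
# Toy sketch of the min-index/midpoint insertion above; values are illustrative.
import numpy as np

indices = np.array([600, 640, 680])   # indices chosen by the linear extraction
min_index = 20                        # index of the noisiest (first) image
input_step = 20

if min_index not in indices:
    mean_index = int((min_index + indices[1]) / 2)            # 330 here
    if mean_index % input_step != 0:
        mean_index = mean_index + (mean_index % input_step)   # -> 340
    if mean_index not in indices:
        indices = np.insert(indices, 0, mean_index)
    indices = np.insert(indices, 0, min_index)

print(indices)  # [ 20 340 600 640 680]
```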