diff --git a/.circleci/config.yml b/.circleci/config.yml
index 3702b08..d4719af 100644
--- a/.circleci/config.yml
+++ b/.circleci/config.yml
@@ -10,7 +10,6 @@ jobs:
       - image: cimg/python:3.10.2
         environment:
           LIMIT_NUMPY_VERSION: 2.0.0
-          LIMIT_SCIPY_VERSION: 1.13.1
     steps:
       - checkout
       - python/install-packages:
@@ -20,7 +19,7 @@ jobs:
           no_output_timeout: 30m
           command: |
             pip install --upgrade pip
-            pip install --only-binary=numpy,scipy "numpy<$LIMIT_NUMPY_VERSION" "scipy<=$LIMIT_SCIPY_VERSION" Cython pytest pytest-cov codecov
+            pip install --only-binary=numpy,scipy "numpy>$LIMIT_NUMPY_VERSION" Cython pytest pytest-cov codecov
             pip install -e .[tests]
       - run:
           name: Run tests
diff --git a/.github/workflows/python-package.yml b/.github/workflows/python-package.yml
index bb928eb..2357894 100644
--- a/.github/workflows/python-package.yml
+++ b/.github/workflows/python-package.yml
@@ -8,7 +8,7 @@ on:
     branches: [ master ]
   pull_request:
     branches: [ master ]
-
+  
 jobs:
   build:
     name: Building on ${{ matrix.os }}
@@ -16,11 +16,10 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        os: [windows-latest, ubuntu-latest, macos-latest]
+        os: [windows-latest, ubuntu-22.04, macos-latest]
         python-version: ["3.9", "3.10", "3.11", "3.12"]
     env:
       LIMIT_NUMPY_VERSION: 2.0.0
-      LIMIT_SCIPY_VERSION: 1.13.1
     steps:
     - name: Get number of CPU cores
       uses: SimenB/github-actions-cpu-cores@v2
@@ -29,7 +28,7 @@ jobs:
     - uses: actions/checkout@v4
 
     - name: Setup Python ${{ matrix.python-version }}
-      if: ${{ ((matrix.os == 'macos-latest') && (matrix.python-version != '3.9')) }}
+      if: ${{ (matrix.os != 'macos-latest') || ((matrix.os == 'macos-latest') && (matrix.python-version != '3.9')) }}
       uses: actions/setup-python@v5
       id: pysetup
       with:
@@ -55,15 +54,20 @@ jobs:
         python${{ matrix.python-version }} -c "import sys; print(sys.version)"
         pip --version
 
+    - name: Display GLIBCXX versions
+      if: matrix.os == 'ubuntu-22.04'
+      run: | 
+        ls /lib/x86_64-linux-gnu/libstdc*
+        strings /usr/lib/x86_64-linux-gnu/libstdc++.so.6 | grep GLIBCXX        
+
     - name: Upgrade pip wheel setuptools
       run: python${{ matrix.python-version }} -m pip install wheel setuptools pip --upgrade
   
     - name: Install other dependencies
-      run: python${{ matrix.python-version }} -m pip install Cython pytest pytest-cov flake8
+      run: python${{ matrix.python-version }} -m pip install Cython pytest pytest-cov flake8 "numpy>${{ env.LIMIT_NUMPY_VERSION }}" scipy
 
-    - name: Install other dependencies
+    - name: Build extensions and install test dependencies
       run: |
-        python${{ matrix.python-version }} -m pip install Cython pytest pytest-cov flake8 "numpy<${{ env.LIMIT_NUMPY_VERSION }}" "scipy<=${{ env.LIMIT_SCIPY_VERSION }}"
         python${{ matrix.python-version }} setup.py build_ext -j${{ steps.cpu-cores.outputs.count }}
         python${{ matrix.python-version }} -m pip install -e .[tests]
 
diff --git a/.github/workflows/python-publish.yml b/.github/workflows/python-publish.yml
index b0022a7..9fded09 100644
--- a/.github/workflows/python-publish.yml
+++ b/.github/workflows/python-publish.yml
@@ -14,7 +14,6 @@ on:
 
 env:
   LIMIT_NUMPY_VERSION: 2.0.0
-  LIMIT_SCIPY_VERSION: 1.13.1
 
 jobs:
   build-wheels:
@@ -23,7 +22,7 @@ jobs:
     strategy:
       fail-fast: false
       matrix:
-        os: [windows-latest, ubuntu-latest, macos-latest]
+        os: [windows-latest, ubuntu-22.04, macos-latest]
         python-version: ["3.9", "3.10", "3.11", "3.12"]
     steps:
     - uses: actions/checkout@v4
@@ -54,12 +53,18 @@ jobs:
       run: | 
         python${{ matrix.python-version }} -c "import sys; print(sys.version)"
         pip --version
+    
+    - name: Display GLIBCXX versions
+      if: matrix.os == 'ubuntu-22.04'
+      run: | 
+        ls /lib/x86_64-linux-gnu/libstdc*
+        strings /usr/lib/x86_64-linux-gnu/libstdc++.so.6 | grep GLIBCXX
 
     - name: Upgrade pip wheel setuptools
       run: python${{ matrix.python-version }} -m pip install wheel setuptools pip --upgrade
 
     - name: Install numpy, scipy
-      run: pip install "numpy<${{ env.LIMIT_NUMPY_VERSION }}" "scipy<=${{ env.LIMIT_SCIPY_VERSION }}"
+      run: pip install "numpy>${{ env.LIMIT_NUMPY_VERSION }}" scipy
     
     - name: Install other dependencies
       run: |
@@ -72,7 +77,7 @@ jobs:
       run: python${{ matrix.python-version }} setup.py bdist_wheel
         
     - name: Rename Linux wheels to supported platform of PyPI
-      if: matrix.os == 'ubuntu-latest'
+      if: matrix.os == 'ubuntu-22.04'
       run: for f in dist/*.whl; do mv "$f" "$(echo "$f" | sed s/linux/manylinux1/)"; done
 
     - name: Publish wheels to GitHub artifacts
@@ -83,7 +88,7 @@ jobs:
 
   publish-pypi:
     needs: [build-wheels]
-    runs-on: ubuntu-latest
+    runs-on: ubuntu-22.04
     steps:
     - uses: actions/checkout@v4
           
@@ -101,9 +106,14 @@ jobs:
     - name: Display Python version
       run: python -c "import sys; print(sys.version)"
 
-    - name: Install numpy
+    - name: Display GLIBCXX versions
+      run: | 
+        ls /lib/x86_64-linux-gnu/libstdc*
+        strings /usr/lib/x86_64-linux-gnu/libstdc++.so.6 | grep GLIBCXX
+
+    - name: Install numpy, scipy
       run: |
-        python -m pip install "numpy<${{ env.LIMIT_NUMPY_VERSION }}" "scipy<=${{ env.LIMIT_SCIPY_VERSION }}"
+        python -m pip install "numpy>${{ env.LIMIT_NUMPY_VERSION }}" scipy
         python -c "import numpy; print(numpy.__version__)"
 
     - name: Install other dependencies
diff --git a/assets/demo.png b/assets/demo.png
new file mode 100644
index 0000000..924ce48
Binary files /dev/null and b/assets/demo.png differ
diff --git a/assets/feedback-dashboard.png b/assets/feedback-dashboard.png
new file mode 100644
index 0000000..878e4a1
Binary files /dev/null and b/assets/feedback-dashboard.png differ
diff --git a/assets/flow.jpg b/assets/flow.jpg
new file mode 100644
index 0000000..3a6d186
Binary files /dev/null and b/assets/flow.jpg differ
diff --git a/assets/recommendation-dashboard.png b/assets/recommendation-dashboard.png
new file mode 100644
index 0000000..d4a4e66
Binary files /dev/null and b/assets/recommendation-dashboard.png differ
diff --git a/cornac/__init__.py b/cornac/__init__.py
index ec7a115..714e9e7 100644
--- a/cornac/__init__.py
+++ b/cornac/__init__.py
@@ -23,4 +23,4 @@
 # Also importable from root
 from .experiment import Experiment
 
-__version__ = '2.3.0'
+__version__ = "2.3.3"
diff --git a/cornac/augmentation/category.py b/cornac/augmentation/category.py
index 6229dac..7092eb4 100644
--- a/cornac/augmentation/category.py
+++ b/cornac/augmentation/category.py
@@ -33,8 +33,7 @@ def load_model(model_name='facebook/bart-large-mnli', cache_dir= None):
     
     return model, tokenizer
 
-model, tokenizer = load_model()
-classifier = pipeline("zero-shot-classification", model=model,tokenizer=tokenizer)
+_classifier = None
 
 def get_category(row, **kwargs):
     """ Enhance the dataset with its category (e.g. news, sports, life)
@@ -49,9 +48,13 @@ def get_category(row, **kwargs):
     -------
     cat: string, corresponding category name for each news id row
     """
+    global _classifier
     candidate_labels = kwargs.get('candidate_labels')
     meta_data = kwargs.get('meta_data')
     threshold = kwargs.get('threshold', 0.5)
+    if candidate_labels and _classifier is None:
+        model, tokenizer = load_model()
+        _classifier = pipeline("zero-shot-classification", model=model,tokenizer=tokenizer)
 
     if candidate_labels:
          # Ensure row is a string (text)
@@ -59,7 +62,7 @@ def get_category(row, **kwargs):
             raise TypeError(f"Expected row to be str (text), but got {type(row).__name__}")
         try:
             # run classifier
-            res = classifier(row, candidate_labels, multi_label=True)
+            res = _classifier(row, candidate_labels, multi_label=True)
 
             categories = res['labels']
             scores = res['scores']
@@ -83,4 +86,4 @@ def get_category(row, **kwargs):
             return -1
 
     # If no candidate labels and no metadata, return -1 (indicating no category found)
-    return -1  # -1 is the default return value in case of missing candidate_labels and meta_data
+    return -1 
diff --git a/cornac/augmentation/enrich_ne.py b/cornac/augmentation/enrich_ne.py
index bcf2d76..9cff63f 100644
--- a/cornac/augmentation/enrich_ne.py
+++ b/cornac/augmentation/enrich_ne.py
@@ -214,14 +214,14 @@ def lookup_and_update(lookup_dict: EfficientDict, alternative: str, all_alternat
                       wikidata: WikidataQuery, language_tags: List[str] = None):
     # Check if alternative is in lookup_dict
     lookup_result = lookup_dict.get(alternative.lower())
+    # If earlier query get nothing, directly return None
+    if lookup_result == '':
+        return None
     # If already enriched, update all alternatives and return stored value
-    if lookup_result:
+    elif lookup_result:
         for dict_key in all_alternatives:
             lookup_dict.add(dict_key.lower(), lookup_result)
         return lookup_result
-    # If earlier query get nothing, directly return None
-    elif lookup_result == '':
-        return None
 
     # If not queried before, query Wikidata
     if language_tags:
@@ -242,9 +242,6 @@ def get_person_data(wikidata: WikidataQuery, entity: Dict, lookup_person: Effici
     """
     Get person data from Wikidata.
     """
-    # print(entity['text'])
-    # print(lookup_person.main_dict)
-    # print(lookup_person.hash_table)
     info = {
         'key': entity['text'],
         'frequency': entity['frequency'],
@@ -269,9 +266,6 @@ def get_org_data(wikidata: WikidataQuery, entity: Dict, lookup_org: EfficientDic
     """
     Get organization data from Wikidata.
     """
-    # print(entity['text'])
-    # print(lookup_org.main_dict)
-    # print(lookup_org.hash_table)
     info = {
         'frequency': entity['frequency'],
         'alternative': entity['alternative']
diff --git a/cornac/augmentation/min_maj.py b/cornac/augmentation/min_maj.py
index 9a79e11..26391f9 100644
--- a/cornac/augmentation/min_maj.py
+++ b/cornac/augmentation/min_maj.py
@@ -25,8 +25,6 @@ def get_min_maj_ratio(ne_list, **kwargs):
     # Check if ne_list is a valid iterable
     if not isinstance(ne_list, list):
         raise TypeError(f"Invalid input: Expected a list for 'ne_list', but received {type(ne_list).__name__}.")
-        # print("Error: ne_list is not a list. Received:", type(ne_list))
-        # return {}  # Return an empty dictionary if ne_list is not valid
 
     # Iterate through each entity in the named entity list
     for entity in ne_list:
@@ -61,13 +59,11 @@ def get_min_maj_ratio(ne_list, **kwargs):
                         for major_place_of_birth in major_place_of_births:
                             if (major_place_of_birth in entity_dict.get('place_of_birth', [])) or not entity_dict.get('place_of_birth'):
                                 place_of_birth_match = True
-
                         if ethnicity_match and place_of_birth_match:
                             count['ethnicity'][1] += entity_dict.get('frequency', 1)
-                            break
-
-                        count['ethnicity'][0] += entity_dict.get('frequency', 1)
-                        break
+                        else:
+                            count['ethnicity'][0] += entity_dict.get('frequency', 1)
+                        break 
 
                 if not loop_break:
                     count['ethnicity'][0] += entity_dict.get('frequency', 1)
diff --git a/cornac/augmentation/ner.py b/cornac/augmentation/ner.py
index 1e8e32f..c505d14 100644
--- a/cornac/augmentation/ner.py
+++ b/cornac/augmentation/ner.py
@@ -122,8 +122,7 @@ def set_ner_lang(lang='en'):
         return ner
         
     except Exception as e:
-        # print(f"An error occurred while loading the SpaCy model: {e}")
-        # return None
+
         raise RuntimeError(f"An unexpected error occurred while loading the SpaCy model '{model_name}': {e}") from e
 
 
@@ -229,8 +228,6 @@ def get_ner(text, ner_model=set_ner_lang(), **kwargs):
                                      'frequency': len(with_name),
                                      'label': label}))
     except Exception as e:
-        # print(f"An error occurred while getting Named Entities: {e}")
-        # ne_list = None
         raise RuntimeError(f"An error occurred while getting Named Entities: {e}")
 
 
diff --git a/cornac/augmentation/party.py b/cornac/augmentation/party.py
index 3e0f18a..7f156ea 100644
--- a/cornac/augmentation/party.py
+++ b/cornac/augmentation/party.py
@@ -56,8 +56,7 @@ def get_party(ne_list, lang, lookup_parties):
     try:
         if not isinstance(ne_list, list):
             raise ValueError(f"Error: when extraing party, expected ne_list to be a list, but got {type(ne_list)} instead.")
-            # print("Error: ne_list is not a list. Received:", type(ne_list))
-            # return {}, {}
+
 
         for entity in ne_list:
             if isinstance(entity, dict):
@@ -93,9 +92,4 @@ def get_party(ne_list, lang, lookup_parties):
     except Exception as e:
         raise RuntimeError(f"Error in get_party function: {e}")
 
-    # except Exception as e:
-    #     # Log any errors during party extraction but ensure the pipeline continues
-    #     print(f"Error in get_party function: {e}")
-    #     return {}, lookup_parties  # Return empty parties in case of failure, but don't stop the pipeline
-
     return parties, lookup_parties
diff --git a/cornac/augmentation/readability.py b/cornac/augmentation/readability.py
index cc6814b..e218e0f 100644
--- a/cornac/augmentation/readability.py
+++ b/cornac/augmentation/readability.py
@@ -177,30 +177,37 @@ def get_readability(text, lang='en'):
         (https://en.wikipedia.org/wiki/Flesch%E2%80%93Kincaid_readability_tests#Flesch_reading_ease).
 
     """
-    # print(f"Computing readability for language:{lang}")
-    try:
-        textstat.set_lang(lang)
-    except KeyError:  # Handle invalid language codes
-        if lang in new_langs.keys():
-            lang = 'en'  # Default to English
-            textstat.set_lang(lang)  # Set language to English
-        else:
-            # print(f"Language code '{lang}' not supported.")
-            # return None
-            raise ValueError(f"Invalid language code '{lang}' provided. Supported language codes are: {', '.join(new_langs.keys())}")
-    
+     
     if not isinstance(text, str):
         raise TypeError(f"Invalid input: Expected a string for 'text', but received {type(text).__name__}.")
+
+    # Extract language root (e.g., "en" from "en_US")
+    lang_root = lang.split("_")[0]
+    
+    # Check if language is supported by either textstat or our custom configs
+    all_supported_langs = set(textstat_langs + list(new_langs.keys()))
+    
+    if lang_root not in all_supported_langs:
+        raise ValueError(f"Invalid language code '{lang}' provided. Supported language codes are: {', '.join(sorted(all_supported_langs))}")
+    
+    # Only set language if it's valid
+    if lang_root in textstat_langs:
+        textstat.set_lang(lang_root)  # Set to root language for textstat
+    else:
+        # For custom languages, we'll use our own calculations, so set to English as fallback
+        textstat.set_lang('en')
+    
     try:
         if not text:
             return None  # Empty text
         # Check if the text contains any meaningful characters
         if not contains_meaningful_characters(text):
             return None
-        lang_root = lang.split("_")[0]
+        # lang_root = lang.split("_")[0]
         if lang_root in textstat_langs:
             readability = textstat.flesch_reading_ease(text)
         else:
+             # Use our custom formula
             flesch = (
                     get_lang_cfg(lang_root, "fre_base")
                     - float(
@@ -214,8 +221,6 @@ def get_readability(text, lang='en'):
             )
             readability = round(flesch, 2)
     except Exception as e:
-        # print(f"An error occurred while getting readability score: {e}")
-        # readability = None
         raise RuntimeError(f"An error occurred while calculating the readability score: {e}")
 
     return readability
diff --git a/cornac/augmentation/sentiment.py b/cornac/augmentation/sentiment.py
index 7662395..99117f2 100644
--- a/cornac/augmentation/sentiment.py
+++ b/cornac/augmentation/sentiment.py
@@ -2,11 +2,7 @@
 import pandas as pd
 import numpy as np
 import os
-# Load the model and tokenizer from the local directory
-# model_dir = "./augmentation/DataEnhancement/models/xlm_roberta_sentiment"
-# tokenizer = AutoTokenizer.from_pretrained(model_dir)
-# model = AutoModelForSequenceClassification.from_pretrained(model_dir)
-# sentiment_analyzer = pipeline("sentiment-analysis", model=model, tokenizer=tokenizer, top_k=None)
+
 
 def load_model(model_name="cardiffnlp/xlm-roberta-base-sentiment-multilingual", cache_dir=None):
     """Load the model and tokenizer from Hugging Face or use a local cache if available.
@@ -40,10 +36,20 @@ def load_model(model_name="cardiffnlp/xlm-roberta-base-sentiment-multilingual",
     
     return model, tokenizer
 
-model, tokenizer = load_model()
-# Create the sentiment analysis pipeline
-sentiment_analyzer = pipeline("sentiment-analysis", model=model, tokenizer=tokenizer, top_k=None)
 
+# Add global variables for lazy loading
+_model = None
+_tokenizer = None
+_sentiment_analyzer = None
+def get_sentiment_analyzer():
+    """Lazy load the sentiment analyzer only when needed."""
+    global _model, _tokenizer, _sentiment_analyzer
+    
+    if _sentiment_analyzer is None:
+        _model, _tokenizer = load_model()
+        _sentiment_analyzer = pipeline("sentiment-analysis", model=_model, tokenizer=_tokenizer, top_k=None)
+    
+    return _sentiment_analyzer
 
 def get_sentiment(text):
     """ Enhance the dataset with its sentiment (-1.0, 1.0) by analyzing sentiment on a sentence-by-sentence basis,
@@ -66,6 +72,7 @@ def get_sentiment(text):
         return None
 
     try:
+        sentiment_analyzer = get_sentiment_analyzer()
         # Split text into manageable chunks
         if len(text) <= 512:
             merged_sentences = [text]
@@ -108,6 +115,5 @@ def get_sentiment(text):
         return sentiment
 
     except Exception as e:
-        # print(f"Error calculating sentiment for text: '{text[:50]}...'. Error: {e}")
-        # return None
+
         raise RuntimeError(f"Error calculating sentiment for text: '{text[:50]}...'. Error: {e}")
diff --git a/cornac/augmentation/text.py b/cornac/augmentation/text.py
index 3704b96..f8cde23 100644
--- a/cornac/augmentation/text.py
+++ b/cornac/augmentation/text.py
@@ -30,8 +30,7 @@ def find_sentences_with_text(soup, text):
 
         return matching_sentences
     except Exception as e:
-        # print(f"Error finding sentences with text: {e}")
-        # return None
+
         raise Exception(f"Error finding sentences with text: {e}")
 
 
@@ -86,6 +85,5 @@ def get_article_text_from_url(url):
             return article_content_element
 
         except Exception as e:
-            # print("Error:", e, 'for url', url)
-            # return None
+
             raise Exception(f"Error while processing the URL {url}: {e}")
diff --git a/cornac/data/dataset.py b/cornac/data/dataset.py
index 6fe3b71..a68fd62 100644
--- a/cornac/data/dataset.py
+++ b/cornac/data/dataset.py
@@ -21,14 +21,11 @@
 import pickle
 import warnings
 from collections import Counter, OrderedDict, defaultdict
-from collections import Counter, OrderedDict, defaultdict
 
 import numpy as np
 from scipy.sparse import csc_matrix, csr_matrix, dok_matrix
-from scipy.sparse import csc_matrix, csr_matrix, dok_matrix
 
 from ..utils import estimate_batches, get_rng, validate_format
-from ..utils import estimate_batches, get_rng, validate_format
 
 
 class Dataset(object):
diff --git a/cornac/datasets/__init__.py b/cornac/datasets/__init__.py
index 6aa516b..c42bb06 100644
--- a/cornac/datasets/__init__.py
+++ b/cornac/datasets/__init__.py
@@ -15,18 +15,15 @@
 
 from . import amazon_clothing
 from . import amazon_digital_music
-from . import amazon_digital_music
 from . import amazon_office
 from . import amazon_toy
 from . import citeulike
 from . import epinions
 from . import filmtrust
 from . import gowalla
-from . import gowalla
 from . import movielens
 from . import netflix
 from . import tafeng
-from . import tafeng
 from . import tradesy
 from . import yoochoose
 
diff --git a/cornac/eval_methods/base_method.py b/cornac/eval_methods/base_method.py
index 9050d5f..52351a0 100644
--- a/cornac/eval_methods/base_method.py
+++ b/cornac/eval_methods/base_method.py
@@ -167,14 +167,11 @@ def cache_rankings(model, user_idx, item_indices,  k = -1):
         return model.ranked_items[user_idx], model.item_scores[user_idx]
 
 
-    # item_idx2id = {v: k for k, v in test_set.iid_map.items()} # cornac item ID : raw item ID
-    # user_idx2id = {v: k for k, v in test_set.uid_map.items()} # cornac user ID : raw user ID
-    # item_id2idx = {k: v for k, v in test_set.iid_map.items()} # raw item ID : cornac item ID
     if not getattr(model, 'is_fitted', False):
         raise RuntimeError("Model is not fitted. Please call `model.fit()` before ranking.")
     
     item_rank, item_scores = model.rank( user_idx=user_idx, item_indices=item_indices, k=k) 
-    # item_rank, item_scores = model.rank( user_idx=user_idx, item_indices=item_indices, k=k,item_idx2id = item_idx2id, user_idx2id = user_idx2id, item_id2idx =  item_id2idx) 
+
 
 
     # Cache the results for future use
@@ -355,10 +352,7 @@ def preprocess_data_for_Fragmentation(user_idx, test_set, model, metrics, item_i
 
             # Separate cached and uncached samples
             for x in sampled_users:
-                # model_ranked_items, _ = cache_rankings(
-                #     model, x, item_indices, k=-1)
-                # model_ranked_items, _ = cache_rankings(
-                #     model, x, item_indices, k=-1)
+
                 model_ranked_items, _ = cache_rankings(
         model,   user_idx=x, item_indices=item_indices, k=-1)
 
@@ -438,8 +432,7 @@ def pos_items(csr_row):
             globalProbs.append(global_prob)
         else:
             globalProbs.append([])
-    pd_other_users = preprocess_data_for_Fragmentation(
-        user_idx, test_set, model, metrics, item_indices=None)
+
 
 
     for user_idx in tqdm(
@@ -483,6 +476,8 @@ def pos_items(csr_row):
         gd_row = gt_mat.getrow(user_idx)
         u_gt_rating[gd_row.indices] = gd_row.data
 
+        pd_other_users = preprocess_data_for_Fragmentation(
+        user_idx, test_set, model, metrics, item_indices=item_indices)
 
         for i, mt in enumerate(metrics):
             mt_score = mt.compute(
@@ -501,14 +496,11 @@ def pos_items(csr_row):
                 user_results[i][user_idx] = mt_score
 
 
-            # user_results[i][user_idx] = mt_score
-
      # avg results of ranking metrics
     for i, mt in enumerate(metrics):
         values = user_results[i].values()
         avg_results.append(sum(values) / len(values) if values else 0)
-        # avg_results.append(
-        #     sum(user_results[i].values()) / len(user_results[i]))
+
 
     return avg_results, user_results
 
diff --git a/cornac/eval_methods/dynamic_rerank_evaluator.py b/cornac/eval_methods/dynamic_rerank_evaluator.py
index 0be0833..0a35b3d 100644
--- a/cornac/eval_methods/dynamic_rerank_evaluator.py
+++ b/cornac/eval_methods/dynamic_rerank_evaluator.py
@@ -39,9 +39,7 @@ def cache_rankings(model, user_idx, item_indices,  k = -1):
         return model.ranked_items[user_idx], model.item_scores[user_idx]
 
 
-    # item_idx2id = {v: k for k, v in test_set.iid_map.items()} # cornac item ID : raw item ID
-    # user_idx2id = {v: k for k, v in test_set.uid_map.items()} # cornac user ID : raw user ID
-    # item_id2idx = {k: v for k, v in test_set.iid_map.items()} # raw item ID : cornac item ID
+
     if not getattr(model, 'is_fitted', False):
         raise RuntimeError("Model is not fitted. Re-ranking requires the model to be fitted or the candidate lists for all users to be ready. Please call `model.fit()` before ranking.")
 
@@ -58,40 +56,12 @@ def cache_rankings(model, user_idx, item_indices,  k = -1):
 
 
 
-# def cache_rankings(model, user_idx, item_indices, k):
-#     '''
-#     Helper function to compute or load a ranked list for a model for a specific user.
 
-#     This function handles ranking operations by:
-#     1. Returning pre-computed rankings and scores from the cache if available.
-#     2. Computing the rankings and scores if they are not already cached.
 
-#     Key Details:
-#     - Newly computed rankings and scores are stored in the cache for future use.
 
-#     Parameters:
-#     - `model`: The recommender model that performs the ranking.
-#     - `user_idx`: The index of the user for whom the ranking is performed.
-#     - `item_indices`: The list of item indices to be ranked.
 
-#     Returns:
-#     - `item_rank`: The ranked list of items for the user.
-#     - `item_scores`: The scores of items corresponding to index in `item_indices` input.
-#     '''
-#     if not hasattr(model, 'ranked_items'):
-#         model.ranked_items = {}
-#     if not hasattr(model, 'item_scores'):
-#         model.item_scores = {}
 
-#     if user_idx in model.ranked_items and user_idx in model.item_scores:
-#         return model.ranked_items[user_idx], model.item_scores[user_idx]
-    
-#     item_rank, item_scores = model.rank( user_idx=user_idx, item_indices=item_indices, k=k)
-  
-#     model.ranked_items[user_idx] = item_rank
-#     model.item_scores[user_idx] = item_scores
 
-#     return item_rank, item_scores
 
 def cache_dynamic_rerankings(reranker, user_idx, train_set, initial_item_rank, recommendation_list, prediction_scores):
     '''
@@ -130,14 +100,12 @@ def cache_dynamic_rerankings(reranker, user_idx, train_set, initial_item_rank, r
     if not hasattr(reranker, 'ranked_items'):
         reranker.ranked_items = {}
     
-    # item_idx2id = {v: k for k, v in test_set.iid_map.items()} # cornac item ID : raw item ID
-    # user_idx2id = {v: k for k, v in test_set.uid_map.items()} # cornac user ID : raw user ID
-    # item_id2idx = {k: v for k, v in test_set.iid_map.items()} # raw item ID : cornac item ID
+
 
     start_time = time.time()
     reranked_list = reranker.rerank(
                     user_idx = user_idx, interaction_history = train_set, candidate_items = initial_item_rank, prediction_scores = prediction_scores, recommendation_list = recommendation_list)
-                            # item_idx2id = item_idx2id, user_idx2id = user_idx2id, item_id2idx =  item_id2idx)
+
 
     reranking_time = time.time() - start_time
 
@@ -266,8 +234,7 @@ def pos_items(csr_row):
         if len(u_gt_pos_items) == 0:
             continue  # Skip if no impression items are clicked for this user
         
-        # item_rank, item_scores = cache_rankings(
-        # model, user_idx,  item_indices, k = -1)
+
         item_rank, item_scores = cache_rankings(
         model,   user_idx=user_idx, item_indices=item_indices, k=-1)
 
@@ -386,8 +353,7 @@ def preprocess_data_for_Fragmentation(user_idx, test_set,  train_set, model, rer
 
             # Separate cached and uncached samples
             for x in sampled_users:
-                # model_ranked_items, model_ranked_scores = cache_rankings(
-                #     model, x, item_indices, k = -1)
+
 
                 model_ranked_items, model_ranked_scores = cache_rankings(
         model,   user_idx = x, item_indices=item_indices, k=-1)
@@ -493,16 +459,25 @@ def pos_items(csr_row):
 
     user_history_dict = OrderedDict()
 
-    def pos_items(csr_row):
-        return [
-            item_idx
-            for (item_idx, rating) in zip(csr_row.indices, csr_row.data)
-            if rating >= rating_threshold
-        ]
     test_user_indices = set(test_set.uir_tuple[0])
     for user_idx in test_user_indices:
+        pos_item_idx = (
+            pos_items(train_mat.getrow(user_idx))
+            if user_idx < train_mat.shape[0]
+            else []
+        )
+        user_history_dict[user_idx] = pos_item_idx
     
-        user_history_dict[user_idx] = pos_items(train_mat.getrow(user_idx))
+    # check if metrics contain Binomial
+    globalProbs = []
+
+    for i, mt in enumerate(metrics):
+        if "Binomial" in mt.name:
+            global_prob = mt.globalFeatureProbs(user_history_dict)
+            globalProbs.append(global_prob)
+        else:
+            globalProbs.append([])
+
     for user_idx in tqdm(
             test_user_indices, desc="Diversity evaluation on Dynamic rerankers", disable=not verbose, miniters=100
     ):
@@ -552,16 +527,6 @@ def pos_items(csr_row):
         u_gt_rating[gd_item_idx] = gd_item_rating
         # interacted and positive rating in training set
         user_history = user_history_dict.get(user_idx, [])
-        # check if metrics contain Binomial
-        globalProbs = []
-        for i, mt in enumerate(metrics):
-            if "Binomial" in mt.name:
-                global_prob = mt.globalFeatureProbs(user_history_dict)
-                globalProbs.append(global_prob)
-            else:
-                globalProbs.append([])
-        
-        
         
         for j in range(len(rerankers)):
             reranker = rerankers[j]
diff --git a/cornac/eval_methods/ratio_split.py b/cornac/eval_methods/ratio_split.py
index f4c48ed..269893a 100644
--- a/cornac/eval_methods/ratio_split.py
+++ b/cornac/eval_methods/ratio_split.py
@@ -1,5 +1,4 @@
 # Copyright 2018 The Cornac Authors. All Rights Reserved.
-############################################################################
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -18,9 +17,6 @@
 
 from .base_method import BaseMethod
 from ..utils.common import safe_indexing
-from .static_rerank_evaluator import StaticReRankEval
-from .dynamic_rerank_evaluator import DynamicReRankEval
-from ..experiment.result import Result
 
 
 class RatioSplit(BaseMethod):
@@ -127,16 +123,4 @@ def _split(self):
         test_data = safe_indexing(self.data, test_idx)
         val_data = safe_indexing(self.data, val_idx) if len(val_idx) > 0 else None
 
-        self.build(train_data=train_data,
-                   test_data=test_data, val_data=val_data)
-
-
-
-
-
-
-
-      
-
-
-    
\ No newline at end of file
+        self.build(train_data=train_data, test_data=test_data, val_data=val_data)
diff --git a/cornac/eval_methods/static_rerank_evaluator.py b/cornac/eval_methods/static_rerank_evaluator.py
index 7c5db0b..4fa4527 100644
--- a/cornac/eval_methods/static_rerank_evaluator.py
+++ b/cornac/eval_methods/static_rerank_evaluator.py
@@ -88,41 +88,7 @@ def cache_rankings(model, user_idx, item_indices, k = -1):
 
     return item_rank, item_scores
 
-# def cache_rankings(model, user_idx, item_indices, k):
-#     '''
-#     Helper function to compute or load a ranked list for a model for a specific user.
-
-#     This function handles ranking operations by:
-#     1. Returning pre-computed rankings and scores from the cache if available.
-#     2. Computing the rankings and scores if they are not already cached.
-
-#     Key Details:
-#     - Newly computed rankings and scores are stored in the cache for future use.
-
-#     Parameters:
-#     - `model`: The recommender model that performs the ranking.
-#     - `user_idx`: The index of the user for whom the ranking is performed.
-#     - `item_indices`: The list of item indices to be ranked.
-
-#     Returns:
-#     - `item_rank`: The ranked list of items for the user.
-#     - `item_scores`: The scores of items corresponding to index in `item_indices` input.
-#     '''
-#     if not hasattr(model, 'ranked_items'):
-#         model.ranked_items = {}
-#     if not hasattr(model, 'item_scores'):
-#         model.item_scores = {}
-
-#     if user_idx in model.ranked_items and user_idx in model.item_scores:
-#         # print(f"Found model {model.name} recommendation for user: {user_idx}")
-#         return model.ranked_items[user_idx], model.item_scores[user_idx]
-    
-#     item_rank, item_scores = model.rank( user_idx=user_idx, item_indices=item_indices, k=k)
-  
-#     model.ranked_items[user_idx] = item_rank
-#     model.item_scores[user_idx] = item_scores
 
-#     return item_rank, item_scores
 
 
 def cache_rerankings(reranker, user_idx, train_set, model_ranked_items, model_ranked_scores):
@@ -510,8 +476,22 @@ def pos_items(csr_row):
         ]
     test_user_indices = set(test_set.uir_tuple[0])
     for user_idx in test_user_indices:
+        pos_item_idx = (
+            pos_items(train_mat.getrow(user_idx))
+            if user_idx < train_mat.shape[0]
+            else []
+        )
+        user_history_dict[user_idx] = pos_item_idx
     
-        user_history_dict[user_idx] = pos_items(train_mat.getrow(user_idx))
+    globalProbs = []
+
+    for i, mt in enumerate(metrics):
+        if "Binomial" in mt.name:
+            global_prob = mt.globalFeatureProbs(user_history_dict)
+            globalProbs.append(global_prob)
+        else:
+            globalProbs.append([])
+
 
     for user_idx in tqdm(
         test_user_indices, desc="Diversity Eval on Re-ranking Results", disable=not verbose, miniters=100
@@ -601,14 +581,9 @@ def pos_items(csr_row):
         u_gt_rating[gd_item_idx] = gd_item_rating
 
         user_history = user_history_dict.get(user_idx, [])
-        globalProbs = []
+  
         pd_other_users = []
-        for i, mt in enumerate(metrics):
-            if "Binomial" in mt.name:
-                global_prob = mt.globalFeatureProbs(user_history_dict)
-                globalProbs.append(global_prob)
-            else:
-                globalProbs.append([])
+        
   
         # Compute metric times and store results
         user_results = [
diff --git a/cornac/experiment/pipelineExperiment.py b/cornac/experiment/pipelineExperiment.py
index aa46f2a..e9cf647 100644
--- a/cornac/experiment/pipelineExperiment.py
+++ b/cornac/experiment/pipelineExperiment.py
@@ -20,7 +20,7 @@
 import numpy as np
 from ..eval_methods.static_rerank_evaluator import StaticReRankEval
 from ..eval_methods.dynamic_rerank_evaluator import DynamicReRankEval
-
+from .result import ExperimentResult
 
 class PipelineExperiment(Experiment):
     """PipelineExperiment Class
@@ -44,7 +44,6 @@ class PipelineExperiment(Experiment):
     """
 
     def __init__(self,
-                 
                  model,
                  metrics,
                 eval_method = None,
@@ -52,6 +51,7 @@ def __init__(self,
                  user_based=True,
                  show_validation=True,
                  verbose=False,
+                 save_dir='.',
                  pipeline_config_file=None):
         """
         Initializes the PipelineExperiment class, setting up models, metrics, rerankers, and configuration 
@@ -77,6 +77,10 @@ def __init__(self,
         verbose : bool, optional (default=False)
             If True, detailed logs and debug information will be printed.
 
+        save_dir: str, optional, default: '.'
+            Path to a directory for storing logs. By default, 
+           logs will be saved in the current working directory.
+
         pipeline_config_file : str, optional
             Path to an .ini configuration file specifying pipeline parameters.
 
@@ -94,9 +98,6 @@ def __init__(self,
         eval_method : cornac.eval_methods.BaseMethod
             Evaluation method used to split the dataset and compute metrics.
 
-        save_dir : str
-            Directory to save evaluation results and recommendations.
-
         models : Recommender
             The recommender model being evaluated.
 
@@ -142,10 +143,8 @@ def __init__(self,
             self.eval_method = self.load_dataset(self.config)
         else:
             self.eval_method = eval_method 
-        self.save_dir = self.config['pipeline'].get(
-            'save_dir', '.')
+        self.save_dir = save_dir
         os.makedirs(self.save_dir, exist_ok=True)
-        
         #  self.models is a `recommender`` object. This pipeline can only process one model.
         self.model = self._validate_models(model)
         # Validate and assign rerankers
@@ -430,38 +429,6 @@ def load_model_scores(self, save_dir):
 
         return item_scores, item_scores_mapped_indices
     
-    def save_results(self, test_result, val_result, save_dir, result_type="model"):
-        """
-        Save the results of the experiment to the specified directory.
-
-        Parameters:
-        -----------
-        test_result : object
-            The test result to save.
-        val_result : object or None
-            The validation result to save, if applicable.
-        save_dir : str
-            Directory to save the results.
-        result_type : str, optional
-            The type of result being saved (e.g., 'model', 'static_reranker'). Default is 'model'.
-
-        """
-        # Check if `all_test_results` attribute exists, if not create it as a dictionary
-        if not hasattr(self, 'all_test_results'):
-            self.all_test_results = {}
-
-        # Add or update the test result for the given result type
-        self.all_test_results[result_type] = test_result
-
-        # If validation results need to be saved separately (optional)
-        if not hasattr(self, 'all_val_results'):
-            self.all_val_results = {}
-
-        if val_result is not None:
-            self.all_val_results[result_type] = val_result
-
-        # Define the path to save the recommendation dictionary
-        test_result.save(save_dir)
 
     def check_missing_recommendations(self, model, eval_method):
         """
@@ -512,6 +479,11 @@ def pos_items(csr_row):
                 missing_user_indices.append(user_idx)
 
         return missing_user_indices
+    
+    def _create_result(self):
+        super()._create_result()
+        self.rerank_result = ExperimentResult()
+
 
     def run(self):
         """
@@ -534,9 +506,12 @@ def run(self):
                 user_based=self.user_based,
                 show_validation=self.show_validation
             )
+            self.result.append(test_result)
+            if self.val_result is not None:
+                self.val_result.append(val_result)
 
-            self.save_results(test_result, val_result,
-                              self.mode_and_paths["model"]['save_eval_path'])
+            test_result.save(self.mode_and_paths["model"]['save_eval_path'])
+                             
             self.model.save_recommendations(
                 self.mode_and_paths["model"]['path'])
             output += "\n" + "="*8 + "model test result" + \
@@ -567,8 +542,10 @@ def run(self):
                 show_validation=self.show_validation,
                 train_mode=False
             )
-            self.save_results(test_result, val_result,
-                              self.mode_and_paths["model"]['save_eval_path'])
+            self.result.append(test_result)
+            if self.val_result is not None:
+                self.val_result.append(val_result)
+            test_result.save(self.mode_and_paths["model"]['save_eval_path'])
 
             output += "\n" + "="*8 + "model test result" + \
                 "="*8 + "\n"+"{}".format(test_result)
@@ -584,8 +561,7 @@ def run(self):
 
             self.model.item_scores, self.model.item_scores_mapped_indices = self.load_model_scores(save_dir)
 
-            # self.model.item_scores = self.load_model_scores(save_dir)
-
+            
             # models.ranked_items must contain recommendation list for all user idx in the test_set!
             # check if the self.models.ranked_items ready.
             missing_user_indices = self.check_missing_recommendations(
@@ -606,9 +582,8 @@ def run(self):
 
             test_result_static_reranker, val_result_static_reranker = static_reranker_evaluator.evaluate(
                 model=self.model, metrics=self.metrics,    user_based=self.user_based, rerankers=self.rerankers,  show_validation=self.show_validation)
-
-            self.save_results(test_result_static_reranker, val_result_static_reranker,
-                              self.mode_and_paths["static_reranker"]['save_eval_path'], result_type="static_reranker")
+            self.rerank_result.append(test_result_static_reranker)
+            test_result_static_reranker.save(self.mode_and_paths["static_reranker"]['save_eval_path'])
 
             output += "\n" + "="*8 + "static rerankers test result" + \
                 "="*8 + "\n"+"{}".format(test_result_static_reranker)
@@ -627,8 +602,8 @@ def run(self):
 
             test_result_static_reranker, val_result_static_reranker = static_reranker_evaluator.evaluate(
                 model=self.model, metrics=self.metrics,    user_based=self.user_based, rerankers=self.rerankers,  show_validation=self.show_validation)
-            self.save_results(test_result_static_reranker, val_result_static_reranker,
-                              self.mode_and_paths["static_reranker"]['save_eval_path'], result_type="static_reranker")
+            self.rerank_result.append(test_result_static_reranker)
+            test_result_static_reranker.save(self.mode_and_paths["static_reranker"]['save_eval_path'])
 
             output += "\n" + "="*8 + "static rerankers test result" + \
                 "="*8 + "\n"+"{}".format(test_result_static_reranker)
@@ -636,9 +611,8 @@ def run(self):
             dyn_reranker_evaluator = DynamicReRankEval(self.eval_method)
             test_result_dyn, val_result_dyn = dyn_reranker_evaluator.evaluate(
                 model=self.model, metrics=self.metrics, user_based = False, rerankers=self.dynamic_rerankers, show_validation=self.show_validation)
-
-            self.save_results(test_result_dyn, val_result_dyn,
-                              self.mode_and_paths["dynamic_reranker"]['save_eval_path'], result_type="dynamic_reranker")
+            self.rerank_result.append(test_result_dyn)
+            test_result_dyn.save(self.mode_and_paths["dynamic_reranker"]['save_eval_path'])
 
             output += "\n" + "="*8 + "dynamic rerankers test result" + \
                 "="*8 + "\n" + "{}".format(test_result_dyn)
@@ -656,9 +630,9 @@ def run(self):
             dyn_reranker_evaluator = DynamicReRankEval(self.eval_method)
             test_result_dyn, val_result_dyn = dyn_reranker_evaluator.evaluate(
                                 model=self.model, metrics=self.metrics, user_based = False, rerankers=self.dynamic_rerankers, show_validation=self.show_validation)
-
-            self.save_results(test_result_dyn, val_result_dyn,
-                              self.mode_and_paths["dynamic_reranker"]['save_eval_path'], result_type="dynamic_reranker")
+            
+            self.rerank_result.append(test_result_dyn)
+            test_result_dyn.save(self.mode_and_paths["dynamic_reranker"]['save_eval_path'])
 
             output += "\n" + "="*8 + "dynamic rerankers test result" + \
                 "="*8 + "\n" + "{}".format(test_result_dyn)
diff --git a/cornac/experiment/result.py b/cornac/experiment/result.py
index 46dad6f..f4b8765 100644
--- a/cornac/experiment/result.py
+++ b/cornac/experiment/result.py
@@ -1,5 +1,5 @@
 # Copyright 2018 The Cornac Authors. All Rights Reserved.
-############################################################################
+#
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
 # You may obtain a copy of the License at
@@ -237,8 +237,8 @@ def organize(self):
         unbiased = np.average(data[2:], axis=0, weights=weights[2:]) * sum(weights[2:])
 
         # weighted average does not meaningful for size
-        for idx, headers in enumerate(headers):
-            if headers == "SIZE":
+        for idx, header in enumerate(headers):
+            if header == "SIZE":
                 unbiased[idx] = sizes[0]
 
         # update the table
@@ -260,7 +260,7 @@ def organize(self):
 
 class ExperimentResult(list):
     """
-    Result Class for an Experiment. A list of obj:`cornac.experiment.Result`. 
+    Result Class for an Experiment. A list of :obj:`cornac.experiment.Result`. 
     """
 
     def __str__(self):
@@ -308,4 +308,4 @@ class CVExperimentResult(ExperimentResult):
     """
 
     def __str__(self):
-        return "\n".join([r.__str__() for r in self])
\ No newline at end of file
+        return "\n".join([r.__str__() for r in self])
diff --git a/cornac/metrics/ranking.py b/cornac/metrics/ranking.py
index e84a3ec..4d04d1d 100644
--- a/cornac/metrics/ranking.py
+++ b/cornac/metrics/ranking.py
@@ -91,7 +91,7 @@ def dcg_score(gt_pos, pd_rank, k=-1):
         else:
             truncated_pd_rank = pd_rank
 
-        ranked_scores = np.in1d(truncated_pd_rank, gt_pos).astype(int)
+        ranked_scores = np.isin(truncated_pd_rank, gt_pos).astype(int)
         gain = 2**ranked_scores - 1
         discounts = np.log2(np.arange(len(ranked_scores)) + 2)
 
@@ -162,7 +162,7 @@ def compute(self, gt_pos, pd_rank, **kwargs):
             truncated_pd_rank = pd_rank
 
         # Compute CRR
-        rec_rank = np.where(np.in1d(truncated_pd_rank, gt_pos))[0]
+        rec_rank = np.where(np.isin(truncated_pd_rank, gt_pos))[0]
         if len(rec_rank) == 0:
             return 0.0
         rec_rank = rec_rank + 1  # +1 because indices starts from 0 in python
@@ -210,7 +210,7 @@ def compute(self, gt_pos, pd_rank, **kwargs):
             Mean Reciprocal Rank score.
 
         """
-        matched_items = np.nonzero(np.in1d(pd_rank, gt_pos))[0]
+        matched_items = np.nonzero(np.isin(pd_rank, gt_pos))[0]
 
         if len(matched_items) == 0:
             raise ValueError(
@@ -267,7 +267,7 @@ def compute(self, gt_pos, pd_rank, **kwargs):
         else:
             truncated_pd_rank = pd_rank
 
-        tp = np.sum(np.in1d(truncated_pd_rank, gt_pos))
+        tp = np.sum(np.isin(truncated_pd_rank, gt_pos))
         tp_fn = len(gt_pos)
         tp_fp = self.k if self.k > 0 else len(truncated_pd_rank)
 
@@ -470,11 +470,11 @@ def compute(self, item_indices, pd_scores, gt_pos, gt_neg=None, **kwargs):
 
         """
 
-        gt_pos_mask = np.in1d(item_indices, gt_pos)
+        gt_pos_mask = np.isin(item_indices, gt_pos)
         gt_neg_mask = (
             np.logical_not(gt_pos_mask)
             if gt_neg is None
-            else np.in1d(item_indices, gt_neg)
+            else np.isin(item_indices, gt_neg)
         )
 
         pos_scores = pd_scores[gt_pos_mask]
@@ -519,7 +519,7 @@ def compute(self, item_indices, pd_scores, gt_pos, **kwargs):
             AP score.
 
         """
-        relevant = np.in1d(item_indices, gt_pos)
+        relevant = np.isin(item_indices, gt_pos)
         rank = rankdata(-pd_scores, "max")[relevant]
         L = rankdata(-pd_scores[relevant], "max")
         ans = (L / rank).mean()
diff --git a/cornac/models/__init__.py b/cornac/models/__init__.py
index 09a925e..1199560 100644
--- a/cornac/models/__init__.py
+++ b/cornac/models/__init__.py
@@ -16,21 +16,14 @@
 from .recommender import Recommender
 from .recommender import NextBasketRecommender
 from .recommender import NextItemRecommender
-from .recommender import NextBasketRecommender
-from .recommender import NextItemRecommender
 
 from .amr import AMR
 from .ann import AnnoyANN
 from .ann import FaissANN
 from .ann import HNSWLibANN
 from .ann import ScaNNANN
-from .ann import AnnoyANN
-from .ann import FaissANN
-from .ann import HNSWLibANN
-from .ann import ScaNNANN
 from .baseline_only import BaselineOnly
 from .beacon import Beacon
-from .beacon import Beacon
 from .bivaecf import BiVAECF
 from .bpr import BPR
 from .bpr import WBPR
@@ -40,7 +33,6 @@
 from .cdr import CDR
 from .coe import COE
 from .companion import Companion
-from .companion import Companion
 from .comparer import ComparERObj
 from .comparer import ComparERSub
 from .conv_mf import ConvMF
@@ -49,34 +41,22 @@
 from .cvaecf import CVAECF
 from .dmrl import DMRL
 from .dnntsp import DNNTSP
-from .dmrl import DMRL
-from .dnntsp import DNNTSP
 from .ease import EASE
-
 from .efm import EFM
-from .enmf import ENMF
-
 from .fm import FM
 from .gcmc import GCMC
-
 from .global_avg import GlobalAvg
 from .gp_top import GPTop
 from .gru4rec import GRU4Rec
-from .gp_top import GPTop
-from .gru4rec import GRU4Rec
 from .hft import HFT
 from .hpf import HPF
 from .hrdr import HRDR
 from .hypar import HypAR
-from .hrdr import HRDR
-from .hypar import HypAR
 from .ibpr import IBPR
 from .knn import ItemKNN
 from .knn import UserKNN
 from .lightgcn import LightGCN
 from .lrppm import LRPPM
-from .lightgcn import LightGCN
-from .lrppm import LRPPM
 from .mcf import MCF
 from .mf import MF
 from .mmmf import MMMF
@@ -87,25 +67,20 @@
 from .ncf import MLP
 from .ncf import NeuMF
 from .ngcf import NGCF
-from .ngcf import NGCF
 from .nmf import NMF
 from .online_ibpr import OnlineIBPR
 from .pcrl import PCRL
 from .pmf import PMF
 from .recvae import RecVAE
-from .recvae import RecVAE
+from .sansa import SANSA
 from .sbpr import SBPR
 from .skm import SKMeans
 from .sorec import SoRec
 from .spop import SPop
-from .spop import SPop
 from .svd import SVD
 from .tifuknn import TIFUKNN
 from .trirank import TriRank
 from .upcf import UPCF
-from .tifuknn import TIFUKNN
-from .trirank import TriRank
-from .upcf import UPCF
 from .vaecf import VAECF
 from .vbpr import VBPR
 from .vmf import VMF
diff --git a/cornac/models/beacon/recom_beacon.py b/cornac/models/beacon/recom_beacon.py
index 93d1b06..b7c6f69 100644
--- a/cornac/models/beacon/recom_beacon.py
+++ b/cornac/models/beacon/recom_beacon.py
@@ -270,7 +270,7 @@ def _remove_diag(self, adj_matrix):
 
     def _normalize(self, adj_matrix: csr_matrix):
         """Symmetrically normalize adjacency matrix."""
-        row_sum = adj_matrix.sum(1).A.squeeze()
+        row_sum = adj_matrix.sum(1).toarray().squeeze()
         d_inv_sqrt = np.power(
             row_sum,
             -0.5,
diff --git a/cornac/models/bivaecf/bivae.py b/cornac/models/bivaecf/bivae.py
index a66f9d3..2488078 100644
--- a/cornac/models/bivaecf/bivae.py
+++ b/cornac/models/bivaecf/bivae.py
@@ -20,7 +20,6 @@
 import torch.nn as nn
 from tqdm.auto import trange
 
-
 EPS = 1e-10
 
 ACT = {
@@ -136,7 +135,7 @@ def loss(self, x, x_, mu, mu_prior, std, kl_beta):
         # Likelihood
         ll_choices = {
             "bern": x * torch.log(x_ + EPS) + (1 - x) * torch.log(1 - x_ + EPS),
-            "gaus": -(x - x_) ** 2,
+            "gaus": -((x - x_) ** 2),
             "pois": x * torch.log(x_ + EPS) - x_,
         }
 
@@ -198,7 +197,7 @@ def learn(
         i_count = 0
         for i_ids in train_set.item_iter(batch_size, shuffle=False):
             i_batch = tx[i_ids, :]
-            i_batch = i_batch.A
+            i_batch = i_batch.toarray()
             i_batch = torch.tensor(i_batch, dtype=dtype, device=device)
 
             # Reconstructed batch
@@ -228,7 +227,7 @@ def learn(
         u_count = 0
         for u_ids in train_set.user_iter(batch_size, shuffle=False):
             u_batch = x[u_ids, :]
-            u_batch = u_batch.A
+            u_batch = u_batch.toarray()
             u_batch = torch.tensor(u_batch, dtype=dtype, device=device)
 
             # Reconstructed batch
@@ -259,7 +258,7 @@ def learn(
     # infer mu_beta
     for i_ids in train_set.item_iter(batch_size, shuffle=False):
         i_batch = tx[i_ids, :]
-        i_batch = i_batch.A
+        i_batch = i_batch.toarray()
         i_batch = torch.tensor(i_batch, dtype=dtype, device=device)
 
         beta, _, i_mu, _ = bivae(i_batch, user=False, theta=bivae.theta)
@@ -268,7 +267,7 @@ def learn(
     # infer mu_theta
     for u_ids in train_set.user_iter(batch_size, shuffle=False):
         u_batch = x[u_ids, :]
-        u_batch = u_batch.A
+        u_batch = u_batch.toarray()
         u_batch = torch.tensor(u_batch, dtype=dtype, device=device)
 
         theta, _, u_mu, _ = bivae(u_batch, user=True, beta=bivae.beta)
diff --git a/cornac/models/bpr/recom_bpr.pyx b/cornac/models/bpr/recom_bpr.pyx
index 3d3387f..85a606b 100644
--- a/cornac/models/bpr/recom_bpr.pyx
+++ b/cornac/models/bpr/recom_bpr.pyx
@@ -37,6 +37,8 @@ from ...utils.common import scale
 from ...utils.init_utils import zeros, uniform
 
 
+DTYPE = np.float32
+
 cdef extern from "recom_bpr.h" namespace "recom_bpr" nogil:
     cdef int get_thread_num()
 
@@ -119,7 +121,7 @@ class BPR(Recommender, ANNMixin):
         seed=None
     ):
         super().__init__(name=name, trainable=trainable, verbose=verbose)
-        self.k = k
+        self.k = int(k)
         self.max_iter = max_iter
         self.learning_rate = learning_rate
         self.lambda_reg = lambda_reg
@@ -144,10 +146,10 @@ class BPR(Recommender, ANNMixin):
         n_users, n_items = self.total_users, self.total_items
 
         if self.u_factors is None:
-            self.u_factors = (uniform((n_users, self.k), random_state=self.rng) - 0.5) / self.k
+            self.u_factors = (uniform((n_users, self.k), random_state=self.rng, dtype=DTYPE) - 0.5) / self.k
         if self.i_factors is None:
-            self.i_factors = (uniform((n_items, self.k), random_state=self.rng) - 0.5) / self.k
-        self.i_biases = zeros(n_items) if self.i_biases is None or self.use_bias is False else self.i_biases
+            self.i_factors = (uniform((n_items, self.k), random_state=self.rng, dtype=DTYPE) - 0.5) / self.k
+        self.i_biases = zeros(n_items, dtype=DTYPE) if self.i_biases is None or self.use_bias is False else self.i_biases
 
     def _prepare_data(self, train_set):
         X = train_set.matrix # csr_matrix
@@ -214,7 +216,6 @@ class BPR(Recommender, ANNMixin):
         """
         cdef:
             long num_samples = len(user_ids), s, i_index, j_index, correct = 0, skipped = 0
-            long num_items = self.num_items
             integral f, i_id, j_id, thread_id
             floating z, score, temp
             bool use_bias = self.use_bias
diff --git a/cornac/models/cdl/recom_cdl.py b/cornac/models/cdl/recom_cdl.py
index b50709f..106acd0 100644
--- a/cornac/models/cdl/recom_cdl.py
+++ b/cornac/models/cdl/recom_cdl.py
@@ -18,11 +18,11 @@
 
 from ..recommender import Recommender
 from ..recommender import ANNMixin, MEASURE_DOT
-from ..recommender import ANNMixin, MEASURE_DOT
 from ...exception import ScoreException
 from ...utils import get_rng
 from ...utils.init_utils import xavier_uniform
 
+
 class CDL(Recommender, ANNMixin):
     """Collaborative Deep Learning.
 
@@ -243,7 +243,7 @@ def _fit_cdl(self, train_set):
                     feed_dict = {
                         model.text_mask: corruption_mask[batch_ids, :],
                         model.text_input: text_feature[batch_ids],
-                        model.ratings: batch_R.A,
+                        model.ratings: batch_R.toarray(),
                         model.C: batch_C,
                         model.item_ids: batch_ids,
                     }
diff --git a/cornac/models/ctr/ctr.py b/cornac/models/ctr/ctr.py
index 0c34c29..6dc5508 100644
--- a/cornac/models/ctr/ctr.py
+++ b/cornac/models/ctr/ctr.py
@@ -29,7 +29,7 @@ def _df_simplex(gamma, v, lambda_v, x):
 
 
 def _is_on_simplex(v, s):
-    if v.sum() < s + 1e-10 and np.alltrue(v > 0):
+    if v.sum() < s + 1e-10 and np.all(v > 0):
         return True
     return False
 
diff --git a/cornac/models/cvae/recom_cvae.py b/cornac/models/cvae/recom_cvae.py
index 66eb5e5..30a6b98 100644
--- a/cornac/models/cvae/recom_cvae.py
+++ b/cornac/models/cvae/recom_cvae.py
@@ -16,11 +16,10 @@
 import numpy as np
 from tqdm.auto import trange
 
-from ..recommender import Recommender
-from ..recommender import ANNMixin, MEASURE_DOT
 from ...exception import ScoreException
 from ...utils import get_rng
 from ...utils.init_utils import xavier_uniform
+from ..recommender import MEASURE_DOT, Recommender
 
 
 class CVAE(Recommender):
@@ -175,9 +174,10 @@ def _fit_cvae(self, train_set):
         )  # normalization
 
         # VAE initialization
-        from .cvae import Model
         import tensorflow.compat.v1 as tf
 
+        from .cvae import Model
+
         tf.disable_eager_execution()
 
         tf.set_random_seed(self.seed)
@@ -216,7 +216,7 @@ def _fit_cvae(self, train_set):
 
                 feed_dict = {
                     model.x: document[batch_ids],
-                    model.ratings: batch_R.A,
+                    model.ratings: batch_R.toarray(),
                     model.C: batch_C,
                     model.item_ids: batch_ids,
                 }
@@ -235,7 +235,7 @@ def _fit_cvae(self, train_set):
 
         tf.reset_default_graph()
 
-    def score(self, user_idx, item_idx=None, **kwargs):
+    def score(self, user_idx, item_idx=None,  **kwargs):
         """Predict the scores/ratings of a user for an item.
 
         Parameters
diff --git a/cornac/models/cvaecf/cvaecf.py b/cornac/models/cvaecf/cvaecf.py
index b7635b4..6367e6f 100644
--- a/cornac/models/cvaecf/cvaecf.py
+++ b/cornac/models/cvaecf/cvaecf.py
@@ -139,7 +139,7 @@ def loss(self, x, x_, mu_qz, logvar_qz, mu_qhx, logvar_qhx, mu_qhy, logvar_qhy,
         ll_choices = {
             "mult": x * torch.log(x_ + EPS),
             "bern": x * torch.log(x_ + EPS) + (1 - x) * torch.log(1 - x_ + EPS),
-            "gaus": -(x - x_) ** 2,
+            "gaus": -((x - x_) ** 2),
             "pois": x * torch.log(x_ + EPS) - x_,
         }
 
@@ -160,29 +160,34 @@ def loss(self, x, x_, mu_qz, logvar_qz, mu_qhx, logvar_qhx, mu_qhy, logvar_qhy,
         std_ph = torch.exp(0.5 * logvar_ph)
 
         # KL(q(h|x)||p(h|x))
-        kld_hx = -0.5 * (1 + 2.0 * torch.log(std_qhx) - (mu_qhx - mu_ph).pow(2) - std_qhx.pow(
-            2))  # assuming std_ph is 1 for now
+        kld_hx = -0.5 * (
+            1 + 2.0 * torch.log(std_qhx) - (mu_qhx - mu_ph).pow(2) - std_qhx.pow(2)
+        )  # assuming std_ph is 1 for now
         kld_hx = torch.sum(kld_hx, dim=1)
 
         # KL(q(h|x)||q(h|y))
-        kld_hy = -0.5 * (1 + 2.0 * torch.log(std_qhx) - 2.0 * torch.log(std_qhy) - (
-                    (mu_qhx - mu_qhy).pow(2) + std_qhx.pow(2)) / std_qhy.pow(2))  # assuming std_ph is 1 for now
+        kld_hy = -0.5 * (
+            1
+            + 2.0 * torch.log(std_qhx)
+            - 2.0 * torch.log(std_qhy)
+            - ((mu_qhx - mu_qhy).pow(2) + std_qhx.pow(2)) / std_qhy.pow(2)
+        )  # assuming std_ph is 1 for now
         kld_hy = torch.sum(kld_hy, dim=1)
 
         return torch.mean(beta * kld_z + alpha_1 * kld_hx + alpha_2 * kld_hy - ll)
 
 
 def learn(
-        cvae,
-        train_set,
-        n_epochs,
-        batch_size,
-        learn_rate,
-        beta,
-        alpha_1,
-        alpha_2,
-        verbose,
-        device=torch.device("cpu"),
+    cvae,
+    train_set,
+    n_epochs,
+    batch_size,
+    learn_rate,
+    beta,
+    alpha_1,
+    alpha_2,
+    verbose,
+    device=torch.device("cpu"),
 ):
     optimizer = torch.optim.Adam(params=cvae.parameters(), lr=learn_rate)
 
@@ -197,11 +202,11 @@ def learn(
         ):
             y_batch = y[u_ids, :]
             y_batch.data = np.ones(len(y_batch.data))  # Binarize data
-            y_batch = y_batch.A
+            y_batch = y_batch.toarray()
             y_batch = torch.tensor(y_batch, dtype=torch.float32, device=device)
 
             x_batch = x[u_ids, :]
-            x_batch = x_batch.A
+            x_batch = x_batch.toarray()
             x_batch = torch.tensor(x_batch, dtype=torch.float32, device=device)
 
             # Reconstructed batch
diff --git a/cornac/models/cvaecf/recom_cvaecf.py b/cornac/models/cvaecf/recom_cvaecf.py
index 30cea1a..e46c634 100644
--- a/cornac/models/cvaecf/recom_cvaecf.py
+++ b/cornac/models/cvaecf/recom_cvaecf.py
@@ -219,12 +219,12 @@ def score(self, user_idx, item_idx=None, **kwargs):
         if item_idx is None:
             y_u = self.r_mat[user_idx].copy()
             y_u.data = np.ones(len(y_u.data))
-            y_u = torch.tensor(y_u.A, dtype=torch.float32, device=self.device)
+            y_u = torch.tensor(y_u.toarray(), dtype=torch.float32, device=self.device)
             z_u, _ = self.cvae.encode_qz(y_u)
 
             x_u = self.u_adj_mat[user_idx].copy()
             x_u.data = np.ones(len(x_u.data))
-            x_u = torch.tensor(x_u.A, dtype=torch.float32, device=self.device)
+            x_u = torch.tensor(x_u.toarray(), dtype=torch.float32, device=self.device)
             h_u, _ = self.cvae.encode_qhx(x_u)
 
             known_item_scores = self.cvae.decode(z_u, h_u).data.cpu().numpy().flatten()
@@ -232,12 +232,12 @@ def score(self, user_idx, item_idx=None, **kwargs):
         else:
             y_u = self.r_mat[user_idx].copy()
             y_u.data = np.ones(len(y_u.data))
-            y_u = torch.tensor(y_u.A, dtype=torch.float32, device=self.device)
+            y_u = torch.tensor(y_u.toarray(), dtype=torch.float32, device=self.device)
             z_u, _ = self.cvae.encode_qz(y_u)
 
             x_u = self.u_adj_mat[user_idx].copy()
             x_u.data = np.ones(len(x_u.data))
-            x_u = torch.tensor(x_u.A, dtype=torch.float32, device=self.device)
+            x_u = torch.tensor(x_u.toarray(), dtype=torch.float32, device=self.device)
             h_u, _ = self.cvae.encode_qhx(x_u)
 
             user_pred = (
diff --git a/cornac/models/ease/recom_ease.py b/cornac/models/ease/recom_ease.py
index f7d7e99..73afbdb 100644
--- a/cornac/models/ease/recom_ease.py
+++ b/cornac/models/ease/recom_ease.py
@@ -123,7 +123,7 @@ def score(self, user_idx, item_idx=None, **kwargs):
         if item_idx is None:
             return self.U[user_idx, :].dot(self.B)
 
-        return self.B[item_idx, :].dot(self.U[user_idx, :])
+        return self.U[user_idx, :].dot(self.B[:, item_idx])
 
     def get_vector_measure(self):
         """Getting a valid choice of vector measurement in ANNMixin._measures.
diff --git a/cornac/models/lstur/recom_lstur.py b/cornac/models/lstur/recom_lstur.py
index e7f6c5a..73dec6d 100644
--- a/cornac/models/lstur/recom_lstur.py
+++ b/cornac/models/lstur/recom_lstur.py
@@ -10,14 +10,12 @@
 # Licensed under the MIT License.
 from ..recommender import Recommender
 import pandas as pd
-# import tensorflow.keras as keras
 import tensorflow as tf
-from tensorflow.compat.v1 import keras
+from tensorflow import keras
 from tensorflow.keras import layers
-# from tensorflow.keras.optimizers import Adam
-tf.compat.v1.disable_eager_execution()  # Force TF1.x behavior
-from cornac.utils.newsrec_utils.newsrec_utils import NewsRecUtil
 
+from cornac.utils.newsrec_utils.newsrec_utils import NewsRecUtil
+import gc
 
 import numpy as np
 from cornac.utils.newsrec_utils.layers import (
@@ -78,7 +76,7 @@ def __init__(self, wordEmb_file = None,
         Recommender.__init__(
             self, name=name, trainable=trainable, verbose=verbose, **kwargs)
         self.seed = seed 
-        tf.compat.v1.set_random_seed(seed)
+        tf.random.set_seed(seed)
         np.random.seed(seed)
 
         if word2vec_embedding is not None:
@@ -106,8 +104,6 @@ def __init__(self, wordEmb_file = None,
         self.word_emb_dim = word_emb_dim
         self.learning_rate = learning_rate
         self.dropout = dropout
-        # self.epochs = epochs
-        # self.batch_size = batch_size
         self.title_size = title_size
         self.history_size = history_size
         # self.head_num = head_num
@@ -120,27 +116,9 @@ def __init__(self, wordEmb_file = None,
         self.filter_num = filter_num
         self.type = type
 
-        self.learning_rate = learning_rate
-        self.dropout = dropout
         self.epochs = epochs
         self.batch_size = batch_size
 
-        ## set News recommendation utils
-        # self.news_organizer = NewsRecUtil(news_title =self.news_title, word_dict = self.word_dict,
-        #                              impressionRating = self.impressionRating, user_history= self.userHistory,
-        #                              history_size = self.history_size,  title_size = self.title_size)
- 
-        # session_conf = tf.ConfigProto()
-        # session_conf.gpu_options.allow_growth = True
-        # sess = tf.Session(config=session_conf)
-         ## set News recommendation utils
-        
-
-
-
-
-
-
 
     def load_dict(self, file_path):
         """load json file
@@ -363,7 +341,6 @@ def fit(self, train_set, val_set=None):
         
         Recommender.fit(self, train_set, val_set)
 
-
         self.train_set = train_set
         self.val_set = val_set
 
@@ -394,7 +371,7 @@ def fit(self, train_set, val_set=None):
                                      history_size = self.history_size,  title_size = self.title_size)
 
         # Configure GPU settings
-        gpus = tf.config.experimental.list_physical_devices("GPU")
+        gpus = tf.config.list_physical_devices("GPU")
         if gpus:
             try:
                 for gpu in gpus:
@@ -403,29 +380,25 @@ def fit(self, train_set, val_set=None):
             except RuntimeError as e:
                 print(f"GPU memory growth setting failed: {e}")
 
+
         # Build model on GPU
         # with tf.device('/GPU:1'):
         self.model, self.scorer = self._build_graph()
-        # self.model.compile(loss="categorical_crossentropy",
-        #                     optimizer=keras.optimizers.Adam(learning_rate=self.learning_rate))
-            # Compile model with Adam optimizer (TensorFlow 2.x compatible)
         self.model.compile(
         loss="categorical_crossentropy",
-        optimizer=tf.keras.optimizers.legacy.Adam(learning_rate=self.learning_rate)  # Ensure Adam is used from tf.keras.optimizers
+        optimizer= keras.optimizers.Adam(learning_rate=self.learning_rate)  
     )
         
-        # self.model, self.scorer = self._build_graph()
-
-        # self.model.compile(loss="categorical_crossentropy",
-        #                    optimizer=keras.optimizers.Adam(learning_rate=self.learning_rate))
-
-
         self.loss_log = []  # Store the loss values over epochs
         # self.click_title_all_users = {}
         for epoch in range(1, self.epochs + 1):
             step = 0
             self.current_epoch = epoch
             epoch_loss = 0
+
+            if epoch > 1 and epoch % 3 == 0:
+                gc.collect()
+            
             tqdm_util = tqdm(
                 self.news_organizer.load_data_from_file(train_set, self.npratio,self.batch_size), desc=f"Epoch {epoch}",
                 leave=False  # Removes stale progress bars
@@ -523,7 +496,7 @@ def score(self, user_idx, item_idx=None, **kwargs):
                 "item_idx should be an int, list, or numpy array")
 
 
-        batch_size = 256  # Define batch size
+        batch_size = self.batch_size  # Define batch size
         candidate_title_indexes = []
         click_title_indexes = []
         user_indexes = []
@@ -576,6 +549,8 @@ def score(self, user_idx, item_idx=None, **kwargs):
             )
 
             all_predictions.append(batch_prediction)
+            if (start // batch_size) % 8 == 0:
+                gc.collect()
             
         # Concatenate all batch predictions into a single array
         final_predictions = np.concatenate(all_predictions, axis=0)
diff --git a/cornac/models/lstur/requirements.txt b/cornac/models/lstur/requirements.txt
index a60e137..8ad4080 100644
--- a/cornac/models/lstur/requirements.txt
+++ b/cornac/models/lstur/requirements.txt
@@ -1 +1 @@
-tensorflow==2.12.0
\ No newline at end of file
+tensorflow>=2.18.0
\ No newline at end of file
diff --git a/cornac/models/mf/backend_cpu.pyx b/cornac/models/mf/backend_cpu.pyx
index 43d9010..78622be 100644
--- a/cornac/models/mf/backend_cpu.pyx
+++ b/cornac/models/mf/backend_cpu.pyx
@@ -19,7 +19,6 @@ import multiprocessing
 
 cimport cython
 from cython.parallel import prange
-from cython cimport floating, integral
 from libcpp cimport bool
 from libc.math cimport abs
 
@@ -28,27 +27,32 @@ cimport numpy as np
 from tqdm.auto import trange
 
 
+ctypedef np.int64_t INT64_t
+
+
 @cython.boundscheck(False)
 @cython.wraparound(False)
-def fit_sgd(integral[:] rid, integral[:] cid, floating[:] val,
-            floating[:, :] U, floating[:, :] V, 
-            floating[:] Bu, floating[:] Bi,
-            long num_users, long num_items,
-            floating lr, floating reg, floating mu,
+def fit_sgd(INT64_t[:] rid, INT64_t[:] cid, float[:] val,
+            float[:, :] U, float[:, :] V, 
+            float[:] Bu, float[:] Bi,
+            float lr, float reg, float mu,
             int max_iter, int num_threads,
             bool use_bias, bool early_stop, bool verbose):
     """Fit the model parameters (U, V, Bu, Bi) with SGD"""
     cdef:
-        long num_ratings = val.shape[0]
+        INT64_t num_ratings = val.shape[0]
+        INT64_t u, i, j
+
         int num_factors = U.shape[1]
+        int f
 
-        floating loss = 0
-        floating last_loss = 0
-        floating r, r_pred, error, u_f, i_f, delta_loss
-        integral u, i, f, j
+        float loss = 0
+        float last_loss = 0
+        float r, r_pred, error, u_f, i_f, delta_loss
+        
 
-        floating * user
-        floating * item
+        float * user
+        float * item
 
     progress = trange(max_iter, disable=not verbose)
     for epoch in progress:
diff --git a/cornac/models/mf/recom_mf.py b/cornac/models/mf/recom_mf.py
index 7d83185..f654124 100644
--- a/cornac/models/mf/recom_mf.py
+++ b/cornac/models/mf/recom_mf.py
@@ -26,6 +26,9 @@
 from ...utils.init_utils import normal, zeros
 
 
+DTYPE = np.float32
+
+
 class MF(Recommender, ANNMixin):
     """Matrix Factorization.
 
@@ -137,20 +140,20 @@ def _init(self):
 
         if self.u_factors is None:
             self.u_factors = normal(
-                [self.num_users, self.k], std=0.01, random_state=rng
+                [self.num_users, self.k], std=0.01, random_state=rng, dtype=DTYPE
             )
         if self.i_factors is None:
             self.i_factors = normal(
-                [self.num_items, self.k], std=0.01, random_state=rng
+                [self.num_items, self.k], std=0.01, random_state=rng, dtype=DTYPE
             )
 
         self.u_biases = (
-            zeros(self.num_users) if self.u_biases is None else self.u_biases
+            zeros(self.num_users, dtype=DTYPE) if self.u_biases is None else self.u_biases
         )
         self.i_biases = (
-            zeros(self.num_items) if self.i_biases is None else self.i_biases
+            zeros(self.num_items, dtype=DTYPE) if self.i_biases is None else self.i_biases
         )
-        self.global_mean = self.global_mean if self.use_bias else 0.0
+        self.global_mean = np.dtype(DTYPE).type(self.global_mean if self.use_bias else 0.0)
 
     def fit(self, train_set, val_set=None):
         """Fit the model to observations.
@@ -190,13 +193,11 @@ def _fit_cpu(self, train_set, val_set):
         backend_cpu.fit_sgd(
             rid,
             cid,
-            val.astype(np.float32),
+            val.astype(DTYPE),
             self.u_factors,
             self.i_factors,
             self.u_biases,
             self.i_biases,
-            self.num_users,
-            self.num_items,
             self.learning_rate,
             self.lambda_reg,
             self.global_mean,
diff --git a/cornac/models/ncf/backend_tf.py b/cornac/models/ncf/backend_tf.py
index 2cf0c59..0ff2bcc 100644
--- a/cornac/models/ncf/backend_tf.py
+++ b/cornac/models/ncf/backend_tf.py
@@ -13,15 +13,8 @@
 # limitations under the License.
 # ============================================================================
 
-import warnings
 
-# disable annoying tensorflow deprecated API warnings
-warnings.filterwarnings("ignore", category=UserWarning)
-
-import tensorflow.compat.v1 as tf
-
-tf.logging.set_verbosity(tf.logging.ERROR)
-tf.disable_v2_behavior()
+import tensorflow as tf
 
 
 act_functions = {
@@ -35,88 +28,98 @@
 }
 
 
-def loss_fn(labels, logits):
-    cross_entropy = tf.reduce_mean(
-        tf.nn.sigmoid_cross_entropy_with_logits(labels=labels, logits=logits)
-    )
-    reg_loss = tf.losses.get_regularization_loss()
-    return cross_entropy + reg_loss
-
-
-def train_fn(loss, learning_rate, learner):
+def get_optimizer(learning_rate, learner):
     if learner.lower() == "adagrad":
-        opt = tf.train.AdagradOptimizer(learning_rate=learning_rate, name="optimizer")
+        return tf.keras.optimizers.Adagrad(learning_rate=learning_rate)
     elif learner.lower() == "rmsprop":
-        opt = tf.train.RMSPropOptimizer(learning_rate=learning_rate, name="optimizer")
+        return tf.keras.optimizers.RMSprop(learning_rate=learning_rate)
     elif learner.lower() == "adam":
-        opt = tf.train.AdamOptimizer(learning_rate=learning_rate, name="optimizer")
+        return tf.keras.optimizers.Adam(learning_rate=learning_rate)
     else:
-        opt = tf.train.GradientDescentOptimizer(
-            learning_rate=learning_rate, name="optimizer"
-        )
-
-    return opt.minimize(loss)
-
-
-def emb(
-    uid, iid, num_users, num_items, emb_size, reg_user, reg_item, seed=None, scope="emb"
-):
-    with tf.variable_scope(scope):
-        user_emb = tf.get_variable(
-            "user_emb",
-            shape=[num_users, emb_size],
-            dtype=tf.float32,
-            initializer=tf.random_normal_initializer(stddev=0.01, seed=seed),
-            regularizer=tf.keras.regularizers.L2(reg_user),
+        return tf.keras.optimizers.SGD(learning_rate=learning_rate)
+
+
+class GMFLayer(tf.keras.layers.Layer):
+    def __init__(self, num_users, num_items, emb_size, reg_user, reg_item, seed=None, **kwargs):
+        super(GMFLayer, self).__init__(**kwargs)
+        self.num_users = num_users
+        self.num_items = num_items
+        self.emb_size = emb_size
+        self.reg_user = reg_user
+        self.reg_item = reg_item
+        self.seed = seed
+        
+        # Initialize embeddings
+        self.user_embedding = tf.keras.layers.Embedding(
+            num_users,
+            emb_size,
+            embeddings_initializer=tf.keras.initializers.RandomNormal(stddev=0.01, seed=seed),
+            embeddings_regularizer=tf.keras.regularizers.L2(reg_user),
+            name="user_embedding"
         )
-        item_emb = tf.get_variable(
-            "item_emb",
-            shape=[num_items, emb_size],
-            dtype=tf.float32,
-            initializer=tf.random_normal_initializer(stddev=0.01, seed=seed),
-            regularizer=tf.keras.regularizers.L2(reg_item),
-        )
-
-    return tf.nn.embedding_lookup(user_emb, uid), tf.nn.embedding_lookup(item_emb, iid)
-
-
-def gmf(uid, iid, num_users, num_items, emb_size, reg_user, reg_item, seed=None):
-    with tf.variable_scope("GMF") as scope:
-        user_emb, item_emb = emb(
-            uid=uid,
-            iid=iid,
-            num_users=num_users,
-            num_items=num_items,
-            emb_size=emb_size,
-            reg_user=reg_user,
-            reg_item=reg_item,
-            seed=seed,
-            scope=scope,
+        
+        self.item_embedding = tf.keras.layers.Embedding(
+            num_items,
+            emb_size,
+            embeddings_initializer=tf.keras.initializers.RandomNormal(stddev=0.01, seed=seed),
+            embeddings_regularizer=tf.keras.regularizers.L2(reg_item),
+            name="item_embedding"
         )
+    
+    def call(self, inputs):
+        user_ids, item_ids = inputs
+        user_emb = self.user_embedding(user_ids)
+        item_emb = self.item_embedding(item_ids)
         return tf.multiply(user_emb, item_emb)
 
 
-def mlp(uid, iid, num_users, num_items, layers, reg_layers, act_fn, seed=None):
-    with tf.variable_scope("MLP") as scope:
-        user_emb, item_emb = emb(
-            uid=uid,
-            iid=iid,
-            num_users=num_users,
-            num_items=num_items,
-            emb_size=int(layers[0] / 2),
-            reg_user=reg_layers[0],
-            reg_item=reg_layers[0],
-            seed=seed,
-            scope=scope,
+class MLPLayer(tf.keras.layers.Layer):
+    def __init__(self, num_users, num_items, layers, reg_layers, act_fn, seed=None, **kwargs):
+        super(MLPLayer, self).__init__(**kwargs)
+        self.num_users = num_users
+        self.num_items = num_items
+        self.layers = layers
+        self.reg_layers = reg_layers
+        self.act_fn = act_fn
+        self.seed = seed
+        
+        # Initialize embeddings
+        self.user_embedding = tf.keras.layers.Embedding(
+            num_users,
+            int(layers[0] / 2),
+            embeddings_initializer=tf.keras.initializers.RandomNormal(stddev=0.01, seed=seed),
+            embeddings_regularizer=tf.keras.regularizers.L2(reg_layers[0]),
+            name="user_embedding"
         )
-        interaction = tf.concat([user_emb, item_emb], axis=-1)
-        for i, layer in enumerate(layers[1:]):
-            interaction = tf.layers.dense(
-                interaction,
-                units=layer,
-                name="layer{}".format(i + 1),
-                activation=act_functions.get(act_fn, tf.nn.relu),
-                kernel_initializer=tf.initializers.lecun_uniform(seed),
-                kernel_regularizer=tf.keras.regularizers.L2(reg_layers[i + 1]),
+        
+        self.item_embedding = tf.keras.layers.Embedding(
+            num_items,
+            int(layers[0] / 2),
+            embeddings_initializer=tf.keras.initializers.RandomNormal(stddev=0.01, seed=seed),
+            embeddings_regularizer=tf.keras.regularizers.L2(reg_layers[0]),
+            name="item_embedding"
+        )
+        
+        # Define dense layers
+        self.dense_layers = []
+        for i, layer_size in enumerate(layers[1:]):
+            self.dense_layers.append(
+                tf.keras.layers.Dense(
+                    layer_size,
+                    activation=act_functions.get(act_fn, tf.nn.relu),
+                    kernel_initializer=tf.keras.initializers.LecunUniform(seed=seed),
+                    kernel_regularizer=tf.keras.regularizers.L2(reg_layers[i + 1]),
+                    name=f"layer{i+1}"
+                )
             )
+    
+    def call(self, inputs):
+        user_ids, item_ids = inputs
+        user_emb = self.user_embedding(user_ids)
+        item_emb = self.item_embedding(item_ids)
+        interaction = tf.concat([user_emb, item_emb], axis=-1)
+        
+        for layer in self.dense_layers:
+            interaction = layer(interaction)
+            
         return interaction
diff --git a/cornac/models/ncf/recom_gmf.py b/cornac/models/ncf/recom_gmf.py
index f55ec7e..7b1a6c3 100644
--- a/cornac/models/ncf/recom_gmf.py
+++ b/cornac/models/ncf/recom_gmf.py
@@ -111,55 +111,45 @@ def __init__(
     ########################
     ## TensorFlow backend ##
     ########################
-    def _build_graph_tf(self):
-        import tensorflow.compat.v1 as tf
-        from .backend_tf import gmf, loss_fn, train_fn
-
-        self.graph = tf.Graph()
-        with self.graph.as_default():
-            tf.set_random_seed(self.seed)
-
-            self.user_id = tf.placeholder(shape=[None], dtype=tf.int32, name="user_id")
-            self.item_id = tf.placeholder(shape=[None], dtype=tf.int32, name="item_id")
-            self.labels = tf.placeholder(
-                shape=[None, 1], dtype=tf.float32, name="labels"
-            )
-
-            self.interaction = gmf(
-                uid=self.user_id,
-                iid=self.item_id,
-                num_users=self.num_users,
-                num_items=self.num_items,
-                emb_size=self.num_factors,
-                reg_user=self.reg,
-                reg_item=self.reg,
-                seed=self.seed,
-            )
-
-            logits = tf.layers.dense(
-                self.interaction,
-                units=1,
-                name="logits",
-                kernel_initializer=tf.initializers.lecun_uniform(self.seed),
-            )
-            self.prediction = tf.nn.sigmoid(logits)
-
-            self.loss = loss_fn(labels=self.labels, logits=logits)
-            self.train_op = train_fn(
-                self.loss, learning_rate=self.lr, learner=self.learner
-            )
-
-            self.initializer = tf.global_variables_initializer()
-            self.saver = tf.train.Saver()
-
-        self._sess_init_tf()
-
-    def _score_tf(self, user_idx, item_idx):
-        feed_dict = {
-            self.user_id: [user_idx],
-            self.item_id: np.arange(self.num_items) if item_idx is None else [item_idx],
-        }
-        return self.sess.run(self.prediction, feed_dict=feed_dict)
+    def _build_model_tf(self):
+        import tensorflow as tf
+        from .backend_tf import GMFLayer
+        
+        # Define inputs
+        user_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="user_input")
+        item_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="item_input")
+        
+        # GMF layer
+        gmf_layer = GMFLayer(
+            num_users=self.num_users,
+            num_items=self.num_items,
+            emb_size=self.num_factors,
+            reg_user=self.reg,
+            reg_item=self.reg,
+            seed=self.seed,
+            name="gmf_layer"
+        )
+        
+        # Get embeddings and element-wise product
+        gmf_vector = gmf_layer([user_input, item_input])
+        
+        # Output layer
+        logits = tf.keras.layers.Dense(
+            1,
+            kernel_initializer=tf.keras.initializers.LecunUniform(seed=self.seed),
+            name="logits"
+        )(gmf_vector)
+        
+        prediction = tf.keras.layers.Activation('sigmoid', name="prediction")(logits)
+        
+        # Create model with both logits and prediction outputs
+        model = tf.keras.Model(
+            inputs=[user_input, item_input],
+            outputs=prediction,
+            name="GMF"
+        )
+        
+        return model
 
     #####################
     ## PyTorch backend ##
diff --git a/cornac/models/ncf/recom_mlp.py b/cornac/models/ncf/recom_mlp.py
index 6901b91..3b2f688 100644
--- a/cornac/models/ncf/recom_mlp.py
+++ b/cornac/models/ncf/recom_mlp.py
@@ -116,60 +116,45 @@ def __init__(
     ########################
     ## TensorFlow backend ##
     ########################
-    def _build_graph_tf(self):
-        import tensorflow.compat.v1 as tf
-        from .backend_tf import mlp, loss_fn, train_fn
-
-        self.graph = tf.Graph()
-        with self.graph.as_default():
-            tf.set_random_seed(self.seed)
-
-            self.user_id = tf.placeholder(shape=[None], dtype=tf.int32, name="user_id")
-            self.item_id = tf.placeholder(shape=[None], dtype=tf.int32, name="item_id")
-            self.labels = tf.placeholder(
-                shape=[None, 1], dtype=tf.float32, name="labels"
-            )
-
-            self.interaction = mlp(
-                uid=self.user_id,
-                iid=self.item_id,
-                num_users=self.num_users,
-                num_items=self.num_items,
-                layers=self.layers,
-                reg_layers=[self.reg] * len(self.layers),
-                act_fn=self.act_fn,
-                seed=self.seed,
-            )
-            logits = tf.layers.dense(
-                self.interaction,
-                units=1,
-                name="logits",
-                kernel_initializer=tf.initializers.lecun_uniform(self.seed),
-            )
-            self.prediction = tf.nn.sigmoid(logits)
-
-            self.loss = loss_fn(labels=self.labels, logits=logits)
-            self.train_op = train_fn(
-                self.loss, learning_rate=self.lr, learner=self.learner
-            )
-
-            self.initializer = tf.global_variables_initializer()
-            self.saver = tf.train.Saver()
-
-        self._sess_init_tf()
-
-    def _score_tf(self, user_idx, item_idx):
-        if item_idx is None:
-            feed_dict = {
-                self.user_id: np.ones(self.num_items) * user_idx,
-                self.item_id: np.arange(self.num_items),
-            }
-        else:
-            feed_dict = {
-                self.user_id: [user_idx],
-                self.item_id: [item_idx],
-            }
-        return self.sess.run(self.prediction, feed_dict=feed_dict)
+    def _build_model_tf(self):
+        import tensorflow as tf
+        from .backend_tf import MLPLayer
+        
+        # Define inputs
+        user_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="user_input")
+        item_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="item_input")
+        
+        # MLP layer
+        mlp_layer = MLPLayer(
+            num_users=self.num_users,
+            num_items=self.num_items,
+            layers=self.layers,
+            reg_layers=[self.reg] * len(self.layers),
+            act_fn=self.act_fn,
+            seed=self.seed,
+            name="mlp_layer"
+        )
+        
+        # Get MLP vector
+        mlp_vector = mlp_layer([user_input, item_input])
+        
+        # Output layer
+        logits = tf.keras.layers.Dense(
+            1,
+            kernel_initializer=tf.keras.initializers.LecunUniform(seed=self.seed),
+            name="logits"
+        )(mlp_vector)
+        
+        prediction = tf.keras.layers.Activation('sigmoid', name="prediction")(logits)
+        
+        # Create model
+        model = tf.keras.Model(
+            inputs=[user_input, item_input],
+            outputs=prediction,
+            name="MLP"
+        )
+        
+        return model
 
     #####################
     ## PyTorch backend ##
diff --git a/cornac/models/ncf/recom_ncf_base.py b/cornac/models/ncf/recom_ncf_base.py
index 1a75ddb..1fc97d4 100644
--- a/cornac/models/ncf/recom_ncf_base.py
+++ b/cornac/models/ncf/recom_ncf_base.py
@@ -14,14 +14,12 @@
 # ============================================================================
 
 
-import numpy as np
 import numpy as np
 from tqdm.auto import trange
 
 from ..recommender import Recommender
 from ...utils import get_rng
 from ...exception import ScoreException
-from ...exception import ScoreException
 
 
 class NCFBase(Recommender):
@@ -143,33 +141,34 @@ def fit(self, train_set, val_set=None):
     ########################
     ## TensorFlow backend ##
     ########################
-    def _build_graph_tf(self):
+    def _build_model_tf(self):
         raise NotImplementedError()
-    
-    def _build_graph(self):
-        import tensorflow.compat.v1 as tf
-
-        self.graph = tf.Graph()
-
-    def _sess_init_tf(self):
-        import tensorflow.compat.v1 as tf
-
-        config = tf.ConfigProto()
-        config.gpu_options.allow_growth = True
-        self.sess = tf.Session(graph=self.graph, config=config)
-        self.sess.run(self.initializer)
-
-    def _get_feed_dict(self, batch_users, batch_items, batch_ratings):
-        return {
-            self.user_id: batch_users,
-            self.item_id: batch_items,
-            self.labels: batch_ratings.reshape(-1, 1),
-        }
 
     def _fit_tf(self, train_set, val_set):
-        if not hasattr(self, "graph"):
-            self._build_graph_tf()
-
+        import tensorflow as tf
+        
+        # Set random seed for reproducibility
+        if self.seed is not None:
+            tf.random.set_seed(self.seed)
+            np.random.seed(self.seed)
+        
+        # Configure GPU memory growth to avoid OOM errors
+        gpus = tf.config.experimental.list_physical_devices('GPU')
+        if gpus:
+            try:
+                for gpu in gpus:
+                    tf.config.experimental.set_memory_growth(gpu, True)
+            except RuntimeError as e:
+                print(e)
+        
+        # Build the model
+        self.model = self._build_model_tf()
+        
+        # Get optimizer
+        from .backend_tf import get_optimizer
+        optimizer = get_optimizer(learning_rate=self.lr, learner=self.learner)
+        
+        # Training loop
         loop = trange(self.num_epochs, disable=not self.verbose)
         for _ in loop:
             count = 0
@@ -179,17 +178,33 @@ def _fit_tf(self, train_set, val_set):
                     self.batch_size, shuffle=True, binary=True, num_zeros=self.num_neg
                 )
             ):
-                _, _loss = self.sess.run(
-                    [self.train_op, self.loss],
-                    feed_dict=self._get_feed_dict(
-                        batch_users, batch_items, batch_ratings
-                    ),
-                )
+                batch_ratings = batch_ratings.reshape(-1, 1, 1)
+                
+                # Convert to tensors
+                batch_users = tf.convert_to_tensor(batch_users, dtype=tf.int32)
+                batch_items = tf.convert_to_tensor(batch_items, dtype=tf.int32)
+                batch_ratings = tf.convert_to_tensor(batch_ratings, dtype=tf.float32)
+                
+                # Training step
+                with tf.GradientTape() as tape:
+                    predictions = self.model([batch_users, batch_items], training=True)
+                    cross_entropy = tf.keras.losses.binary_crossentropy(
+                        y_true=batch_ratings,
+                        y_pred=predictions,
+                        from_logits=False  # predictions are already probabilities
+                    )
+                    cross_entropy = tf.reduce_mean(cross_entropy)
+                    loss_value = cross_entropy + tf.reduce_sum(self.model.losses)
+                    
+                # Apply gradients
+                grads = tape.gradient(loss_value, self.model.trainable_variables)
+                optimizer.apply_gradients(zip(grads, self.model.trainable_variables))
+                
                 count += len(batch_users)
-                sum_loss += len(batch_users) * _loss
+                sum_loss += len(batch_users) * loss_value.numpy()
                 if i % 10 == 0:
                     loop.set_postfix(loss=(sum_loss / count))
-
+            
             if self.early_stopping is not None and self.early_stop(
                 train_set, val_set, **self.early_stopping
             ):
@@ -197,7 +212,24 @@ def _fit_tf(self, train_set, val_set):
         loop.close()
 
     def _score_tf(self, user_idx, item_idx):
-        raise NotImplementedError()
+        """Score function for TensorFlow models."""
+        import tensorflow as tf
+        
+        if item_idx is None:
+            # Score all items for a given user
+            user_tensor = tf.convert_to_tensor([user_idx], dtype=tf.int32)
+            item_tensor = tf.convert_to_tensor(np.arange(self.num_items), dtype=tf.int32)
+            
+            # Broadcast user_idx to match the shape of item_tensor
+            user_tensor = tf.broadcast_to(user_tensor, shape=item_tensor.shape)
+        else:
+            # Score a specific item for a given user
+            user_tensor = tf.convert_to_tensor([user_idx], dtype=tf.int32)
+            item_tensor = tf.convert_to_tensor([item_idx], dtype=tf.int32)
+        
+        # Get predictions
+        predictions = self.model([user_tensor, item_tensor], training=False)
+        return predictions.numpy().squeeze()
 
     #####################
     ## PyTorch backend ##
@@ -278,7 +310,9 @@ def save(self, save_dir=None):
         model_file = Recommender.save(self, save_dir)
 
         if self.backend == "tensorflow":
-            self.saver.save(self.sess, model_file.replace(".pkl", ".cpt"))
+            # Save the TensorFlow model
+            if hasattr(self, "model"):
+                self.model.save_weights(model_file.replace(".pkl", ".h5"))
         elif self.backend == "pytorch":
             # TODO: implement model saving for PyTorch
             raise NotImplementedError()
@@ -308,8 +342,10 @@ def load(model_path, trainable=False):
             model.pretrained = False
 
         if model.backend == "tensorflow":
-            model._build_graph()
-            model.saver.restore(model.sess, model.load_from.replace(".pkl", ".cpt"))
+            # Build the model
+            model.model = model._build_model_tf()
+            # Load weights
+            model.model.load_weights(model.load_from.replace(".pkl", ".h5"))
         elif model.backend == "pytorch":
             # TODO: implement model loading for PyTorch
             raise NotImplementedError()
diff --git a/cornac/models/ncf/recom_neumf.py b/cornac/models/ncf/recom_neumf.py
index 760048d..8e3f9ff 100644
--- a/cornac/models/ncf/recom_neumf.py
+++ b/cornac/models/ncf/recom_neumf.py
@@ -157,121 +157,102 @@ def from_pretrained(self, pretrained_gmf, pretrained_mlp, alpha=0.5):
     ########################
     ## TensorFlow backend ##
     ########################
-    def _build_graph_tf(self):
-        import tensorflow.compat.v1 as tf
-        from .backend_tf import gmf, mlp, loss_fn, train_fn
-
-        self.graph = tf.Graph()
-        with self.graph.as_default():
-            tf.set_random_seed(self.seed)
-
-            self.gmf_user_id = tf.placeholder(
-                shape=[None], dtype=tf.int32, name="gmf_user_id"
-            )
-            self.mlp_user_id = tf.placeholder(
-                shape=[None], dtype=tf.int32, name="mlp_user_id"
-            )
-            self.item_id = tf.placeholder(shape=[None], dtype=tf.int32, name="item_id")
-            self.labels = tf.placeholder(
-                shape=[None, 1], dtype=tf.float32, name="labels"
-            )
-
-            gmf_feat = gmf(
-                uid=self.gmf_user_id,
-                iid=self.item_id,
-                num_users=self.num_users,
-                num_items=self.num_items,
-                emb_size=self.num_factors,
-                reg_user=self.reg,
-                reg_item=self.reg,
-                seed=self.seed,
-            )
-            mlp_feat = mlp(
-                uid=self.mlp_user_id,
-                iid=self.item_id,
-                num_users=self.num_users,
-                num_items=self.num_items,
-                layers=self.layers,
-                reg_layers=[self.reg] * len(self.layers),
-                act_fn=self.act_fn,
-                seed=self.seed,
-            )
-
-            self.interaction = tf.concat([gmf_feat, mlp_feat], axis=-1)
-            logits = tf.layers.dense(
-                self.interaction,
-                units=1,
-                name="logits",
-                kernel_initializer=tf.initializers.lecun_uniform(self.seed),
-            )
-            self.prediction = tf.nn.sigmoid(logits)
-
-            self.loss = loss_fn(labels=self.labels, logits=logits)
-            self.train_op = train_fn(
-                self.loss, learning_rate=self.lr, learner=self.learner
-            )
-
-            self.initializer = tf.global_variables_initializer()
-            self.saver = tf.train.Saver()
-
-        self._sess_init_tf()
-
+    def _build_model_tf(self):
+        import tensorflow as tf
+        from .backend_tf import GMFLayer, MLPLayer
+        
+        # Define inputs
+        user_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="user_input")
+        item_input = tf.keras.layers.Input(shape=(1,), dtype=tf.int32, name="item_input")
+        
+        # GMF layer
+        gmf_layer = GMFLayer(
+            num_users=self.num_users,
+            num_items=self.num_items,
+            emb_size=self.num_factors,
+            reg_user=self.reg,
+            reg_item=self.reg,
+            seed=self.seed,
+            name="gmf_layer"
+        )
+        
+        # MLP layer
+        mlp_layer = MLPLayer(
+            num_users=self.num_users,
+            num_items=self.num_items,
+            layers=self.layers,
+            reg_layers=[self.reg] * len(self.layers),
+            act_fn=self.act_fn,
+            seed=self.seed,
+            name="mlp_layer"
+        )
+        
+        # Get embeddings and element-wise product
+        gmf_vector = gmf_layer([user_input, item_input])
+        mlp_vector = mlp_layer([user_input, item_input])
+        
+        # Concatenate GMF and MLP vectors
+        concat_vector = tf.keras.layers.Concatenate(axis=-1)([gmf_vector, mlp_vector])
+        
+        # Output layer
+        logits = tf.keras.layers.Dense(
+            1,
+            kernel_initializer=tf.keras.initializers.LecunUniform(seed=self.seed),
+            name="logits"
+        )(concat_vector)
+        
+        prediction = tf.keras.layers.Activation('sigmoid', name="prediction")(logits)
+        
+        # Create model
+        model = tf.keras.Model(
+            inputs=[user_input, item_input],
+            outputs=prediction,
+            name="NeuMF"
+        )
+        
+        # Handle pretrained models
         if self.pretrained:
-            gmf_kernel = self.pretrained_gmf.sess.run(
-                self.pretrained_gmf.sess.graph.get_tensor_by_name("logits/kernel:0")
+            # Get GMF and MLP models
+            gmf_model = self.pretrained_gmf.model
+            mlp_model = self.pretrained_mlp.model
+            
+            # Copy GMF embeddings
+            model.get_layer('gmf_layer').user_embedding.set_weights(
+                gmf_model.get_layer('gmf_layer').user_embedding.get_weights()
             )
-            gmf_bias = self.pretrained_gmf.sess.run(
-                self.pretrained_gmf.sess.graph.get_tensor_by_name("logits/bias:0")
+            model.get_layer('gmf_layer').item_embedding.set_weights(
+                gmf_model.get_layer('gmf_layer').item_embedding.get_weights()
             )
-            mlp_kernel = self.pretrained_mlp.sess.run(
-                self.pretrained_mlp.sess.graph.get_tensor_by_name("logits/kernel:0")
+            
+            # Copy MLP embeddings and layers
+            model.get_layer('mlp_layer').user_embedding.set_weights(
+                mlp_model.get_layer('mlp_layer').user_embedding.get_weights()
             )
-            mlp_bias = self.pretrained_mlp.sess.run(
-                self.pretrained_mlp.sess.graph.get_tensor_by_name("logits/bias:0")
+            model.get_layer('mlp_layer').item_embedding.set_weights(
+                mlp_model.get_layer('mlp_layer').item_embedding.get_weights()
             )
-            logits_kernel = np.concatenate(
-                [self.alpha * gmf_kernel, (1 - self.alpha) * mlp_kernel]
-            )
-            logits_bias = self.alpha * gmf_bias + (1 - self.alpha) * mlp_bias
-
-            for v in self.graph.get_collection(tf.GraphKeys.TRAINABLE_VARIABLES):
-                if v.name.startswith("GMF"):
-                    sess = self.pretrained_gmf.sess
-                    self.sess.run(
-                        tf.assign(v, sess.run(sess.graph.get_tensor_by_name(v.name)))
-                    )
-                elif v.name.startswith("MLP"):
-                    sess = self.pretrained_mlp.sess
-                    self.sess.run(
-                        tf.assign(v, sess.run(sess.graph.get_tensor_by_name(v.name)))
-                    )
-                elif v.name.startswith("logits/kernel"):
-                    self.sess.run(tf.assign(v, logits_kernel))
-                elif v.name.startswith("logits/bias"):
-                    self.sess.run(tf.assign(v, logits_bias))
-
-    def _get_feed_dict(self, batch_users, batch_items, batch_ratings):
-        return {
-            self.gmf_user_id: batch_users,
-            self.mlp_user_id: batch_users,
-            self.item_id: batch_items,
-            self.labels: batch_ratings.reshape(-1, 1),
-        }
-
-    def _score_tf(self, user_idx, item_idx):
-        if item_idx is None:
-            feed_dict = {
-                self.gmf_user_id: [user_idx],
-                self.mlp_user_id: np.ones(self.num_items) * user_idx,
-                self.item_id: np.arange(self.num_items),
-            }
-        else:
-            feed_dict = {
-                self.gmf_user_id: [user_idx],
-                self.mlp_user_id: [user_idx],
-                self.item_id: [item_idx],
-            }
-        return self.sess.run(self.prediction, feed_dict=feed_dict)
+            
+            # Copy dense layers in MLP
+            for i, layer in enumerate(model.get_layer('mlp_layer').dense_layers):
+                layer.set_weights(mlp_model.get_layer('mlp_layer').dense_layers[i].get_weights())
+            
+            # Combine weights for output layer
+            gmf_logits_weights = gmf_model.get_layer('logits').get_weights()
+            mlp_logits_weights = mlp_model.get_layer('logits').get_weights()
+            
+            # Combine kernel weights
+            combined_kernel = np.concatenate([
+                self.alpha * gmf_logits_weights[0],
+                (1.0 - self.alpha) * mlp_logits_weights[0]
+            ], axis=0)
+            
+            # Combine bias weights
+            combined_bias = self.alpha * gmf_logits_weights[1] + (1.0 - self.alpha) * mlp_logits_weights[1]
+            
+            # Set combined weights to output layer
+            model.get_layer('logits').set_weights([combined_kernel, combined_bias])
+        
+        return model
 
     #####################
     ## PyTorch backend ##
diff --git a/cornac/models/ncf/requirements.txt b/cornac/models/ncf/requirements.txt
index 71cfbab..eaabc09 100644
--- a/cornac/models/ncf/requirements.txt
+++ b/cornac/models/ncf/requirements.txt
@@ -1,3 +1,2 @@
-tensorflow==2.12.0
+tensorflow>=2.12.0
 torch>=0.4.1
-tensorflow==2.12.0
\ No newline at end of file
diff --git a/cornac/models/npa/recom_npa.py b/cornac/models/npa/recom_npa.py
index c1ccc9b..c8506fe 100644
--- a/cornac/models/npa/recom_npa.py
+++ b/cornac/models/npa/recom_npa.py
@@ -7,17 +7,17 @@
 import re
 import json
 import tensorflow as tf
-from tensorflow.compat.v1 import keras
-tf.compat.v1.disable_eager_execution()
+from tensorflow import keras
 from tensorflow.keras import layers
 import numpy as np
 from cornac.utils.newsrec_utils.layers import PersonalizedAttentivePooling
 from cornac.utils.newsrec_utils.newsrec_utils import NewsRecUtil
 import pandas as pd
 from tqdm.auto import tqdm
-# tf.compat.v1.disable_eager_execution()
+
 import os
 import pickle
+import gc 
 
 class NPA(Recommender):
     """NPA model(Neural News Recommendation with Attentive Multi-View Learning)
@@ -69,7 +69,8 @@ def __init__(self,
         Recommender.__init__(
             self, name=name, trainable=trainable, verbose=verbose,  **kwargs)
         self.seed = seed
-        tf.compat.v1.set_random_seed(seed)
+        tf.random.set_seed(seed)
+        np.random.seed(seed)
         if word2vec_embedding is not None:
             self.word2vec_embedding = word2vec_embedding  # Load directly from params
         else:
@@ -110,15 +111,7 @@ def __init__(self,
         self.epochs = epochs
         self.batch_size = batch_size
 
-        ## set News recommendation utils
-        # self.news_organizer = NewsRecUtil(news_title =self.news_title, word_dict = self.word_dict,
-        #                              impressionRating = self.impressionRating, user_history= self.userHistory,
-        #                              history_size = self.history_size,  title_size = self.title_size)
-
 
-        # session_conf = tf.ConfigProto()
-        # session_conf.gpu_options.allow_growth = True
-        # sess = tf.Session(config=session_conf)
 
 
 
@@ -392,7 +385,7 @@ def fit(self, train_set, val_set=None):
 
         
         # Configure GPU settings
-        gpus = tf.config.experimental.list_physical_devices("GPU")
+        gpus = tf.config.list_physical_devices("GPU")
         if gpus:
             try:
                 for gpu in gpus:
@@ -404,9 +397,10 @@ def fit(self, train_set, val_set=None):
         # Build model on GPU
         # with tf.device('/GPU:3'):
         self.model, self.scorer = self._build_graph()
+        # self.model.compile(loss="categorical_crossentropy",
+        #                     optimizer=tf.keras.optimizers.legacy.Adam(learning_rate=self.learning_rate))
         self.model.compile(loss="categorical_crossentropy",
-                            optimizer=tf.keras.optimizers.legacy.Adam(learning_rate=self.learning_rate))
-
+                            optimizer= keras.optimizers.Adam(learning_rate=self.learning_rate))
         # self.model, self.scorer = self._build_graph()
 
         # self.model.compile(loss="categorical_crossentropy",
@@ -428,6 +422,8 @@ def fit(self, train_set, val_set=None):
             step = 0
             self.current_epoch = epoch
             epoch_loss = 0
+            if epoch > 1 and epoch % 3 == 0:
+                gc.collect()
 
             tqdm_util = tqdm(
                 self.news_organizer.load_data_from_file(train_set, self.npratio,self.batch_size), desc=f"Epoch {epoch}",
@@ -517,7 +513,7 @@ def score(self, user_idx, item_idx=None, **kwargs):
             raise Exception(
                 "item_idx should be an int, list, or numpy array")
         
-        batch_size = 256
+        batch_size = self.batch_size
         candidate_title_indexes = []
         click_title_indexes = []
         user_indexes = []
@@ -571,6 +567,8 @@ def score(self, user_idx, item_idx=None, **kwargs):
             )
 
             all_predictions.append(batch_prediction)
+            if (start // batch_size) % 8 == 0:
+                gc.collect()
 
         # Concatenate all batch predictions into a single array
         
@@ -713,7 +711,7 @@ def load_npa(cls, save_dir):
         # Compile the model with the stored learning rate
         model.model.compile(
             loss="categorical_crossentropy",
-            optimizer=tf.keras.optimizers.legacy.Adam(learning_rate=model.learning_rate)
+            optimizer= keras.optimizers.Adam(learning_rate=model.learning_rate)
         )
 
         #################
diff --git a/cornac/models/npa/requirements.txt b/cornac/models/npa/requirements.txt
index a60e137..8ad4080 100644
--- a/cornac/models/npa/requirements.txt
+++ b/cornac/models/npa/requirements.txt
@@ -1 +1 @@
-tensorflow==2.12.0
\ No newline at end of file
+tensorflow>=2.18.0
\ No newline at end of file
diff --git a/cornac/models/nrms/recom_nrms.py b/cornac/models/nrms/recom_nrms.py
index 4a6898b..f9ab4b5 100644
--- a/cornac/models/nrms/recom_nrms.py
+++ b/cornac/models/nrms/recom_nrms.py
@@ -13,10 +13,8 @@
 
 from tqdm.auto import trange
 from ..recommender import Recommender
-# import tensorflow.keras as keras
 import tensorflow as tf
-from tensorflow.compat.v1 import keras
-tf.compat.v1.disable_eager_execution()
+from tensorflow import keras
 from tensorflow.keras import layers
 from cornac.utils.newsrec_utils.layers import AttLayer2, SelfAttention
 from cornac.utils.newsrec_utils.newsrec_utils import NewsRecUtil
@@ -29,7 +27,7 @@
 import json
 import os
 import pandas as pd
-
+import gc 
 
 class NRMS(Recommender):
     """NRMS model(Neural News Recommendation with Multi-Head Self-Attention)
@@ -154,7 +152,7 @@ def __init__(
 
 
         # Configure GPU settings
-        gpus = tf.config.experimental.list_physical_devices("GPU")
+        gpus = tf.config.list_physical_devices("GPU")
         if gpus:
             try:
                 for gpu in gpus:
@@ -167,7 +165,7 @@ def __init__(
         # with tf.device('/GPU:0'):
         self.model, self.scorer = self._build_graph()
         self.model.compile(loss="categorical_crossentropy",
-                            optimizer=tf.keras.optimizers.legacy.Adam(learning_rate=self.learning_rate))
+                            optimizer= keras.optimizers.Adam(learning_rate=self.learning_rate))
 
     def load_dict(self, file_path):
         """load json file
@@ -352,7 +350,6 @@ def fit(self, train_set, val_set=None):
             object: An instance of self.
         """
         Recommender.fit(self, train_set, val_set)
-
         self.train_set = train_set
         self.val_set = val_set
 
@@ -398,6 +395,10 @@ def fit(self, train_set, val_set=None):
             self.current_epoch = epoch
             epoch_loss = 0
 
+            #  Memory cleanup every few epochs 
+            if epoch > 1 and epoch % 3 == 0:
+                gc.collect()
+
             tqdm_util = tqdm(
                 self.news_organizer.load_data_from_file(train_set, self.npratio,self.batch_size), desc=f"Epoch {epoch}",
                 leave=False , # Removes stale progress bars
@@ -508,7 +509,7 @@ def score(self, user_idx, item_idx=None, **kwargs):
 
     
 
-        batch_size = 256  # Define batch size
+        batch_size = self.batch_size  # Define batch size
         candidate_title_indexes = []
         click_title_indexes = []
         # Get user's click history or handle unknown users
@@ -558,6 +559,8 @@ def score(self, user_idx, item_idx=None, **kwargs):
             )
 
             all_predictions.append(batch_prediction)
+            if (start // batch_size) % 8 == 0:
+                gc.collect()
 
         # Concatenate all batch predictions into a single array
         final_predictions = np.concatenate(all_predictions, axis=0)
@@ -690,7 +693,7 @@ def load_nrms(cls, save_dir):
         # Compile the model with the stored learning rate
         model.model.compile(
             loss="categorical_crossentropy",
-            optimizer=tf.keras.optimizers.legacy.Adam(learning_rate=model.learning_rate)
+            optimizer=keras.optimizers.Adam(learning_rate=model.learning_rate)
         )
 
         # Load the saved model weights
diff --git a/cornac/models/nrms/requirements.txt b/cornac/models/nrms/requirements.txt
index a60e137..8ad4080 100644
--- a/cornac/models/nrms/requirements.txt
+++ b/cornac/models/nrms/requirements.txt
@@ -1 +1 @@
-tensorflow==2.12.0
\ No newline at end of file
+tensorflow>=2.18.0
\ No newline at end of file
diff --git a/cornac/models/pcrl/pcrl.py b/cornac/models/pcrl/pcrl.py
index 331c7e6..8e6fa5b 100644
--- a/cornac/models/pcrl/pcrl.py
+++ b/cornac/models/pcrl/pcrl.py
@@ -379,7 +379,7 @@ def learn(self, train_set):
 
         for epoch in range(self.n_epoch):
             for idx in train_set.item_iter(self.batch_size, shuffle=False):
-                batch_C = self.aux_data[idx].A
+                batch_C = self.aux_data[idx].toarray()
                 EE = self.sess.run(E_, feed_dict={C: batch_C})
                 z_c = self.sess.run(X_g, feed_dict={C: batch_C, E: EE})
                 feed_dict = {
diff --git a/cornac/models/pld/recom_pld.py b/cornac/models/pld/recom_pld.py
index 403de37..436f21b 100644
--- a/cornac/models/pld/recom_pld.py
+++ b/cornac/models/pld/recom_pld.py
@@ -73,8 +73,9 @@ def __init__(
         **kwargs):
 
         Recommender.__init__(self, name=name, trainable=trainable, verbose=verbose, **kwargs)
-
-        self.party_dict = party_dict
+        
+        
+        self.party_dict = self._normalize_party_dict(party_dict)
         self.articles = list(party_dict.keys())
 
         # check the format of the distribution, make sure every user type has same article types, which means for every row there are same columns at the second element.
@@ -96,7 +97,40 @@ def __init__(
 
         self.group_recommendations_generated = False
 
+    def _find_config_section(self, config, model_name):
+        """Find configuration section case-insensitively."""
+        model_name_lower = model_name.lower()
+        
+        # Look for exact match (case-insensitive)
+        for section_name in config.sections():
+            if section_name.lower() == model_name_lower:
+                return section_name
+        
+        return None
 
+    def _get_config_value(self, section, primary_key, fallback_keys=None):
+        """Get configuration value with case-insensitive key matching."""
+        fallback_keys = fallback_keys or []
+        all_keys = [primary_key] + fallback_keys
+        
+        # Try each key (case-insensitive)
+        for key in all_keys:
+            # Try exact key first
+            if key in section:
+                return section[key].strip()
+            
+            # Try case-insensitive match
+            for actual_key in section.keys():
+                if actual_key.lower() == key.lower():
+                    return section[actual_key].strip()
+        
+        # If not found, raise error with helpful message
+        available_keys = list(section.keys())
+        raise ValueError(
+            f"Required configuration key not found. Tried: {all_keys}\n"
+            f"Available keys: {available_keys}"
+        )
+    
     def fit(self, train_set, val_set=None):
 
         """Fit the model to observations.
@@ -126,20 +160,54 @@ def fit(self, train_set, val_set=None):
             config = configparser.ConfigParser()
             config.read(self.configure_path)
 
-            section_name = self.name
+            section_name = self._find_config_section(config, self.name)
 
-            if section_name in config:
-                raw_parties = config[section_name].get('parties', '')
-                self.party_list = raw_parties.split(",")
-                # print(f"self.party_list: {self.party_list}")
+            if section_name:
+                raw_parties =  self._get_config_value(
+                    config[section_name], 
+                    'parties',
+                    ['party_list', 'party_names', 'political_parties']
+                )
+                self.party_list = [party.strip() for party in raw_parties.split(",") if party.strip()]
+                
+                # Case-insensitive key lookup with fallbacks
+                self.positive_score_party = self._get_config_value(
+                    config[section_name], 
+                    'positive_score_party_name',
+                    ['positive_party', 'pos_party']
+                )
+                self.negative_score_party = self._get_config_value(
+                    config[section_name],
+                    'negative_score_party_name', 
+                    ['negative_party', 'neg_party']
+                )
+                
+                if self.verbose:
+                    print(f"Using configuration section: [{section_name}]")
+                    print(f"Loaded parties: {self.party_list}")
+                    
             else:
+                available_sections = list(config.sections())
                 raise ValueError(
-                    f"Configuration Error: Section '{section_name}' not found in '{self.configure_path}'.\n"
-                    f"Please check your configuration file and ensure the section [{section_name}] exists."
+                    f"Configuration Error: No section found for model '{self.name}'.\n"
+                    f"Available sections: {available_sections}.\n"
                 )
 
-            self.positive_score_party = config[section_name]['positive_score_party_name']
-            self.negative_score_party = config[section_name]['negative_score_party_name']
+            # section_name = self.name
+
+
+            # if section_name in config:
+            #     raw_parties = config[section_name].get('parties', '')
+            #     self.party_list = raw_parties.split(",")
+            #     # print(f"self.party_list: {self.party_list}")
+            # else:
+            #     raise ValueError(
+            #         f"Configuration Error: Section '{section_name}' not found in '{self.configure_path}'.\n"
+            #         f"Please check your configuration file and ensure the section [{section_name}] exists."
+            #     )
+
+            # self.positive_score_party = config[section_name]['positive_score_party_name']
+            # self.negative_score_party = config[section_name]['negative_score_party_name']
 
             train_uir = list(zip(*train_set.uir_tuple))
 
@@ -160,6 +228,17 @@ def fit(self, train_set, val_set=None):
   
         return self
 
+    def _normalize_party_dict(self, party_dict):
+        """Normalize party dictionary for case-insensitive lookups."""
+        if not isinstance(party_dict, dict):
+            raise ValueError("party_dict must be a dictionary")
+        
+        normalized_dict = {}
+        for key, value in party_dict.items():
+            # Convert key to lowercase for consistent lookup
+            normalized_key = str(key).lower()
+            normalized_dict[normalized_key] = value
+        return normalized_dict
     
     def rank(self, user_idx, item_indices = None, k = -1, **kwargs):
         if not self.group_recommendations_generated:
diff --git a/cornac/models/pld/score_calculator.py b/cornac/models/pld/score_calculator.py
index d218f48..98e6e69 100644
--- a/cornac/models/pld/score_calculator.py
+++ b/cornac/models/pld/score_calculator.py
@@ -15,29 +15,28 @@ def calculatePoliticalScore(history_dict, party_dict_raw, party_list, num_users)
     user_score_matrix = np.full((num_users, len(party_list)), 0, dtype=float)
     party_dict = {}
     for k, v in party_dict_raw.items():
+        k_norm = str(k).lower()
         if len(list(v)) == 0:
-            party_dict[k] = -1
-            # party_dict[k] = 0
+            party_dict[k_norm] = -1
+            # party_dict[k_norm] = 0
         else:
-
             political_dict = {item: v[item] for item in party_list if item in v.keys()}
-
             if political_dict:
                 max_party = max(political_dict, key=political_dict.get)
-                party_dict[k] = party_list.index(max_party)
+                party_dict[k_norm] = party_list.index(max_party)
             else:
-                party_dict[k] = -1
-                # party_dict[k] = 0
+                party_dict[k_norm] = -1
+                # party_dict[k_norm] = 0
         
     for user_idx, article_list in history_dict.items():
-
         # Update: for multi-party situation
         for i, article in enumerate(article_list):
-            if article in party_dict.keys():
-                if party_dict[article] == -1:
+            article_norm = str(article).lower()
+            if article_norm in party_dict.keys():
+                if party_dict[article_norm] == -1:
                     continue
-                # print(party_dict[article])
-                user_score_matrix[user_idx][party_dict[article]] += 1
+                # print(party_dict[article_norm])
+                user_score_matrix[user_idx][party_dict[article_norm]] += 1
 
     # user_score_matrix = roundColumnScore(user_score_matrix)
     user_score_matrix =  compute_political_leaning(user_score_matrix)
@@ -81,12 +80,12 @@ def calculateArticleScore(history_dict, userScores, num_users, num_items, party_
     
     # for i in range(len(article_pool)):
     for i, article_id in enumerate(article_pool):
-        
-        parties = party_dict.get(article_id, {}) 
+        article_norm = str(article_id).lower()
+        parties = party_dict.get(article_norm, {})
 
         positive_score_parties_count = parties.get(positive_score_party_name, 0)
         negative_score_parties_count = parties.get(negative_score_party_name, 0)
-        
+
         article_mention_matrix[i, 0] = positive_score_parties_count  # First column for positive score party count (e.g., Republican count)
         article_mention_matrix[i, 1] = negative_score_parties_count    # Second column for negative score party count (e.g., Democrat count) 
 
diff --git a/cornac/models/pmf/recom_pmf.py b/cornac/models/pmf/recom_pmf.py
index 9cd5697..14a3976 100644
--- a/cornac/models/pmf/recom_pmf.py
+++ b/cornac/models/pmf/recom_pmf.py
@@ -144,7 +144,7 @@ def fit(self, train_set, val_set=None):
                 res = pmf.pmf_linear(
                     uid,
                     iid,
-                    rat,
+                    rat.astype(np.float32),
                     k=self.k,
                     n_users=self.num_users,
                     n_items=self.num_items,
@@ -161,7 +161,7 @@ def fit(self, train_set, val_set=None):
                 res = pmf.pmf_non_linear(
                     uid,
                     iid,
-                    rat,
+                    rat.astype(np.float32),
                     k=self.k,
                     n_users=self.num_users,
                     n_items=self.num_items,
diff --git a/cornac/models/recommender.py b/cornac/models/recommender.py
index 2da5944..f0149c9 100644
--- a/cornac/models/recommender.py
+++ b/cornac/models/recommender.py
@@ -191,11 +191,9 @@ def item_ids(self):
         if self.__item_ids is None:
             self.__item_ids = list(self.iid_map.keys())
         return self.__item_ids
-        # self.ranked_items = {}
-        # self.item_scores = {}
 
     def reset_info(self):
-        self.best_value = -np.Inf
+        self.best_value = float("-inf")
         self.best_epoch = 0
         self.current_epoch = 0
         self.stopped_epoch = 0
@@ -219,8 +217,7 @@ def _get_init_params(cls):
             return []
 
         init_signature = inspect.signature(init)
-        parameters = [p for p in init_signature.parameters.values()
-                      if p.name != "self"]
+        parameters = [p for p in init_signature.parameters.values() if p.name != "self"]
 
         return sorted([p.name for p in parameters])
 
@@ -498,8 +495,7 @@ def score(self, user_idx, item_idx=None):
             Relative scores that the user gives to the item or to all known items
 
         """
-        raise NotImplementedError(
-            "The algorithm is not able to make score prediction!")
+        raise NotImplementedError("The algorithm is not able to make score prediction!")
 
     def default_score(self):
         """Overwrite this function if your algorithm has special treatment for cold-start problem"""
@@ -644,7 +640,6 @@ def rank(self, user_idx, item_indices=None, k=-1, **kwargs):
             if item_indices is None
             else np.asarray(item_indices)
         )
-      
         item_scores = all_item_scores[item_indices]
 
         if k != -1:  # O(n + k log k), faster for small k which is usually the case
diff --git a/cornac/models/sansa/README.md b/cornac/models/sansa/README.md
new file mode 100644
index 0000000..92ae76f
--- /dev/null
+++ b/cornac/models/sansa/README.md
@@ -0,0 +1,10 @@
+# Dependencies
+Training of SANSA uses [scikit-sparse](https://github.com/scikit-sparse/scikit-sparse), which depends on the [SuiteSparse](https://github.com/DrTimothyAldenDavis/SuiteSparse) numerical library. To install SuiteSparse on Ubuntu and macOS, run the commands below:
+```
+# Ubuntu
+sudo apt-get install libsuitesparse-dev
+
+# macOS
+brew install suite-sparse
+```
+After installing SuiteSparse, simply install the requirements.txt.
\ No newline at end of file
diff --git a/cornac/models/sansa/__init__.py b/cornac/models/sansa/__init__.py
new file mode 100644
index 0000000..67f4f75
--- /dev/null
+++ b/cornac/models/sansa/__init__.py
@@ -0,0 +1 @@
+from .recom_sansa import SANSA
diff --git a/cornac/models/sansa/recom_sansa.py b/cornac/models/sansa/recom_sansa.py
new file mode 100644
index 0000000..21bfe67
--- /dev/null
+++ b/cornac/models/sansa/recom_sansa.py
@@ -0,0 +1,289 @@
+import numpy as np
+import scipy.sparse as sp
+
+from ..recommender import Recommender
+from ..recommender import ANNMixin, MEASURE_DOT
+from ...exception import ScoreException
+
+
+class SANSA(Recommender, ANNMixin):
+    """Scalable Approximate NonSymmetric Autoencoder for Collaborative Filtering.
+
+    Parameters
+    ----------
+    name: string, optional, default: 'SANSA'
+        The name of the recommender model.
+
+    l2: float, optional, default: 1.0
+        L2-norm regularization-parameter λ ∈ R+.
+    
+    weight_matrix_density: float, optional, default: 1e-3
+        Density of weight matrices. 
+
+    compute_gramian: boolean, optional, default: True
+        Indicates whether training input X is a user-item matrix (represents a bipartite graph) or \
+        or an item-item matrix (e.g, co-occurrence matrix; not a bipartite graph).
+
+    factorizer_class: string, optional, default: 'ICF'
+        Class of Cholesky factorizer. Supported values:
+        - 'CHOLMOD' - exact Cholesky factorization using CHOLMOD algorithm, followed by pruning.
+        - 'ICF' - Incomplete Cholesky factorization (i.e., pruning on-the-fly)
+        CHOLMOD provides higher-quality approximate factorization for increased price. \
+        ICF is less accurate but more scalable (recommended method when num_items >= ~50K-100K).
+        Note that ICF uses additional matrix preprocessing and hence different (smaller) l2 regularization.
+        
+    factorizer_shift_step: float, optional, default: 1e-3
+        Used with ICF factorizer.
+        Incomplete factorization may break (zero division), indicating need for increased l2 regularization.
+        'factorizer_shift_step' is the initial increase in l2 regularization (after first breakdown).
+
+    factorizer_shift_multiplier: float, optional, default: 2.0
+        Used with ICF factorizer.
+        Multiplier for factorizer shift. After k-th breakdown, additional l2 regularization is \
+        'factorizer_shift_step' * 'factorizer_shift_multiplier'^(k-1)
+
+    inverter_scans: integer, optional, default: 3
+        Number of scans repairing the approximate inverse factor. Scans repair all columns with residual below \
+        a certain threshold, and this threshold goes to 0 in later scans. More scans give more accurate results \
+        but take longer. We recommend values between 0 and 5, use lower values if scans take too long.
+
+    inverter_finetune_steps: integer, optional, default: 10
+        Repairs a small portion of columns with highest residuals. All finetune steps take (roughly) the same amount of time.
+        We recommend values between 0 and 30.
+
+    use_absolute_value_scores: boolean, optional, default: False
+        Following https://dl.acm.org/doi/abs/10.1145/3640457.3688179, it is recommended for EASE-like models to consider \
+        the absolute value of scores in situations when X^TX is sparse.
+
+    trainable: boolean, optional, default: True
+        When False, the model is not trained and Cornac assumes that the model is already \
+        trained. 
+        
+    verbose: boolean, optional, default: False
+        When True, some running logs are displayed.
+
+    seed: int, optional, default: None
+        Random seed for parameters initialization.
+
+    References
+    ----------
+    * Martin Spišák, Radek Bartyzal, Antonín Hoskovec, Ladislav Peska, and Miroslav Tůma. 2023. \
+    Scalable Approximate NonSymmetric Autoencoder for Collaborative Filtering. \
+    In Proceedings of the 17th ACM Conference on Recommender Systems (RecSys '23). \
+    Association for Computing Machinery, New York, NY, USA, 763–770. https://doi.org/10.1145/3604915.3608827
+
+    * SANSA GitHub Repository: https://github.com/glami/sansa
+    """
+
+    def __init__(
+        self,
+        name="SANSA",
+        l2=1.0,
+        weight_matrix_density=1e-3,
+        compute_gramian=True,
+        factorizer_class="ICF",
+        factorizer_shift_step=1e-3,
+        factorizer_shift_multiplier=2.0,
+        inverter_scans=3,
+        inverter_finetune_steps=10,
+        use_absolute_value_scores=False,
+        trainable=True,
+        verbose=True,
+        seed=None,
+        W1=None,  # "weights[0] (sp.csr_matrix)"
+        W2=None,  # "weights[1] (sp.csr_matrix)"
+        X=None,  # user-item interaction matrix (sp.csr_matrix)
+    ):
+        Recommender.__init__(self, name=name, trainable=trainable, verbose=verbose)
+        self.l2 = l2
+        self.weight_matrix_density = weight_matrix_density
+        self.compute_gramian = compute_gramian
+        self.factorizer_class = factorizer_class
+        self.factorizer_shift_step = factorizer_shift_step
+        self.factorizer_shift_multiplier = factorizer_shift_multiplier
+        self.inverter_scans = inverter_scans
+        self.inverter_finetune_steps = inverter_finetune_steps
+        self.use_absolute_value_scores = use_absolute_value_scores
+        self.verbose = verbose
+        self.seed = seed
+        self.X = X.astype(np.float32) if X is not None and X.dtype != np.float32 else X
+        self.weights = (W1, W2)
+
+    def fit(self, train_set, val_set=None):
+        """Fit the model to observations.
+
+        Parameters
+        ----------
+        train_set: :obj:`cornac.data.Dataset`, required
+            User-Item preference data as well as additional modalities.
+
+        val_set: :obj:`cornac.data.Dataset`, optional, default: None
+            User-Item preference data for model selection purposes (e.g., early stopping).
+
+        Returns
+        -------
+        self : object
+        """
+        Recommender.fit(self, train_set, val_set)
+
+        from sansa.core import (
+            FactorizationMethod,
+            GramianFactorizer,
+            CHOLMODGramianFactorizerConfig,
+            ICFGramianFactorizerConfig,
+            UnitLowerTriangleInverter,
+            UMRUnitLowerTriangleInverterConfig,
+        )
+        from sansa.utils import get_squared_norms_along_compressed_axis, inplace_scale_along_compressed_axis, inplace_scale_along_uncompressed_axis
+
+        # User-item interaction matrix (sp.csr_matrix)
+        self.X = train_set.matrix.astype(np.float32)
+
+        if self.factorizer_class == "CHOLMOD":
+            self.factorizer_config = CHOLMODGramianFactorizerConfig()
+        else:
+            self.factorizer_config = ICFGramianFactorizerConfig(
+                factorization_shift_step=self.factorizer_shift_step,  # initial diagonal shift if incomplete factorization fails
+                factorization_shift_multiplier=self.factorizer_shift_multiplier,  # multiplier for the shift for subsequent attempts
+            )
+        self.factorizer = GramianFactorizer.from_config(self.factorizer_config)
+        self.factorization_method = self.factorizer_config.factorization_method
+
+        self.inverter_config = UMRUnitLowerTriangleInverterConfig(
+            scans=self.inverter_scans,  # number of scans through all columns of the matrix
+            finetune_steps=self.inverter_finetune_steps,  # number of finetuning steps, targeting worst columns
+        )
+        self.inverter = UnitLowerTriangleInverter.from_config(self.inverter_config)
+
+        # create a working copy of user_item_matrix
+        X = self.X.copy()
+
+        if self.factorization_method == FactorizationMethod.ICF:
+            # scale matrix X
+            if self.compute_gramian:
+                # Inplace scale columns of X by square roots of column norms of X^TX.
+                da = np.sqrt(np.sqrt(get_squared_norms_along_compressed_axis(X.T @ X)))
+                # Divide columns of X by the computed square roots of row norms of X^TX
+                da[da == 0] = 1  # ignore zero elements
+                inplace_scale_along_uncompressed_axis(X, 1 / da)  # CSR column scaling
+                del da
+            else:
+                # Inplace scale rows and columns of X by square roots of row norms of X.
+                da = np.sqrt(np.sqrt(get_squared_norms_along_compressed_axis(X)))
+                # Divide rows and columns of X by the computed square roots of row norms of X
+                da[da == 0] = 1  # ignore zero elements
+                inplace_scale_along_uncompressed_axis(X, 1 / da)  # CSR column scaling
+                inplace_scale_along_compressed_axis(X, 1 / da)  # CSR row scaling
+                del da
+
+        # Compute LDL^T decomposition of
+        # - P(X^TX + self.l2 * I)P^T if compute_gramian=True
+        # - P(X + self.l2 * I)P^T if compute_gramian=False
+        if self.verbose:
+            print("Computing LDL^T decomposition of permuted item-item matrix...")
+        L, D, p = self.factorizer.approximate_ldlt(
+            X,
+            self.l2,
+            self.weight_matrix_density,
+            compute_gramian=self.compute_gramian,
+        )
+        del X
+
+        # Compute approximate inverse of L using selected method
+        if self.verbose:
+            print("Computing approximate inverse of L...")
+        L_inv = self.inverter.invert(L)
+        del L
+
+        # Construct W = L_inv @ P
+        inv_p = np.argsort(p)
+        W = L_inv[:, inv_p]
+        del L_inv
+
+        # Construct W_r (A^{-1} = W.T @ W_r)
+        W_r = W.copy()
+        inplace_scale_along_uncompressed_axis(W_r, 1 / D.diagonal())
+
+        # Extract diagonal entries
+        diag = W.copy()
+        diag.data = diag.data**2
+        inplace_scale_along_uncompressed_axis(diag, 1 / D.diagonal())
+        diagsum = diag.sum(axis=0)  # original
+        del diag
+        diag = np.asarray(diagsum)[0]
+
+        # Divide columns of the inverse by negative diagonal entries
+        # equivalent to dividing the columns of W by negative diagonal entries
+        inplace_scale_along_compressed_axis(W_r, -1 / diag)
+        self.weights = (W.T.tocsr(), W_r.tocsr())
+
+        return self
+
+    def forward(self, X: sp.csr_matrix) -> sp.csr_matrix:
+        """
+        Forward pass.
+        """
+        latent = X @ self.weights[0]
+        out = latent @ self.weights[1]
+        return out
+
+    def score(self, user_idx, item_idx=None):
+        """Predict the scores/ratings of a user for an item.
+
+        Parameters
+        ----------
+        user_idx: int, required
+            The index of the user for whom to perform score prediction.
+
+        item_idx: int, optional, default: None
+            The index of the item for which to perform score prediction.
+            If None, scores for all known items will be returned.
+
+        Returns
+        -------
+        res : A scalar or a Numpy array
+            Relative scores that the user gives to the item or to all known items
+
+        """
+        if self.is_unknown_user(user_idx):
+            raise ScoreException("Can't make score prediction for user %d" % user_idx)
+
+        if item_idx is not None and self.is_unknown_item(item_idx):
+            raise ScoreException("Can't make score prediction for item %d" % item_idx)
+
+        scores = self.forward(self.X[user_idx]).toarray().reshape(-1)
+        if self.use_absolute_value_scores:
+            scores = np.abs(scores)
+        if item_idx is None:
+            return scores
+        return scores[item_idx]
+
+    def get_vector_measure(self):
+        """Getting a valid choice of vector measurement in ANNMixin._measures.
+
+        Returns
+        -------
+        measure: MEASURE_DOT
+            Dot product aka. inner product
+        """
+        return MEASURE_DOT
+
+    def get_user_vectors(self):
+        """Getting a matrix of user vectors serving as query for ANN search.
+
+        Returns
+        -------
+        out: numpy.array
+            Matrix of user vectors for all users available in the model.
+        """
+        return self.X @ self.weights[0]
+
+    def get_item_vectors(self):
+        """Getting a matrix of item vectors used for building the index for ANN search.
+
+        Returns
+        -------
+        out: numpy.array
+            Matrix of item vectors for all items available in the model.
+        """
+        return self.self.weights[1]
diff --git a/cornac/models/sansa/requirements.txt b/cornac/models/sansa/requirements.txt
new file mode 100644
index 0000000..b898b4b
--- /dev/null
+++ b/cornac/models/sansa/requirements.txt
@@ -0,0 +1 @@
+sansa >= 1.1.0
\ No newline at end of file
diff --git a/cornac/models/vaecf/recom_vaecf.py b/cornac/models/vaecf/recom_vaecf.py
index a6a4777..f29d6db 100644
--- a/cornac/models/vaecf/recom_vaecf.py
+++ b/cornac/models/vaecf/recom_vaecf.py
@@ -38,7 +38,6 @@ class VAECF(Recommender):
     likelihood: str, default: 'mult'
         Name of the likelihood function used for modeling the observations.
         Supported choices:
-        
         mult: Multinomial likelihood
         bern: Bernoulli likelihood
         gaus: Gaussian likelihood
@@ -193,16 +192,10 @@ def score(self, user_idx, item_idx=None,**kwargs):
         if item_idx is None:
             x_u = self.r_mat[user_idx].copy()
             x_u.data = np.ones(len(x_u.data))
-            z_u, _ = self.vae.encode(
-                torch.tensor(x_u.A, dtype=torch.float32, device=self.device)
-            )
+            z_u, _ = self.vae.encode(torch.tensor(x_u.toarray(), dtype=torch.float32, device=self.device))
             return self.vae.decode(z_u).data.cpu().numpy().flatten()
         else:
             x_u = self.r_mat[user_idx].copy()
             x_u.data = np.ones(len(x_u.data))
-            z_u, _ = self.vae.encode(
-                torch.tensor(x_u.A, dtype=torch.float32, device=self.device)
-            )
-            return (
-                self.vae.decode(z_u).data.cpu().numpy().flatten()[item_idx]
-            )  # Fix me I am not efficient
+            z_u, _ = self.vae.encode(torch.tensor(x_u.toarray(), dtype=torch.float32, device=self.device))
+            return self.vae.decode(z_u).data.cpu().numpy().flatten()[item_idx]  # Fix me I am not efficient
diff --git a/cornac/models/vaecf/vaecf.py b/cornac/models/vaecf/vaecf.py
index e5bbdc7..5a5bca4 100644
--- a/cornac/models/vaecf/vaecf.py
+++ b/cornac/models/vaecf/vaecf.py
@@ -89,7 +89,7 @@ def loss(self, x, x_, mu, logvar, beta):
         ll_choices = {
             "mult": x * torch.log(x_ + EPS),
             "bern": x * torch.log(x_ + EPS) + (1 - x) * torch.log(1 - x_ + EPS),
-            "gaus": -(x - x_) ** 2,
+            "gaus": -((x - x_) ** 2),
             "pois": x * torch.log(x_ + EPS) - x_,
         }
 
@@ -129,7 +129,7 @@ def learn(
         ):
             u_batch = train_set.matrix[u_ids, :]
             u_batch.data = np.ones(len(u_batch.data))  # Binarize data
-            u_batch = u_batch.A
+            u_batch = u_batch.toarray()
             u_batch = torch.tensor(u_batch, dtype=torch.float32, device=device)
 
             # Reconstructed batch
diff --git a/cornac/models/wmf/recom_wmf.py b/cornac/models/wmf/recom_wmf.py
index 92416b7..9467041 100644
--- a/cornac/models/wmf/recom_wmf.py
+++ b/cornac/models/wmf/recom_wmf.py
@@ -66,7 +66,6 @@ class WMF(Recommender, ANNMixin):
 
         U: ndarray, shape (n_users,k)
             The user latent factors, optional initialization via init_params.
-            
         V: ndarray, shape (n_items,k)
             The item latent factors, optional initialization via init_params.
 
@@ -191,7 +190,7 @@ def _fit_cf(self, train_set):
                     batch_C = np.ones(batch_R.shape) * self.b
                     batch_C[batch_R.nonzero()] = self.a
                     feed_dict = {
-                        model.ratings: batch_R.A,
+                        model.ratings: batch_R.toarray(),
                         model.C: batch_C,
                         model.item_ids: batch_ids,
                     }
diff --git a/cornac/serving/app.py b/cornac/serving/app.py
index 41e9225..ffa8c07 100644
--- a/cornac/serving/app.py
+++ b/cornac/serving/app.py
@@ -119,7 +119,7 @@ def create_app():
 
 @app.route("/recommend", methods=["GET"])
 def recommend():
-    global model, train_set
+    global model, train_set # noqa: F824
 
     if model is None:
         return "Model is not yet loaded. Please try again later.", 400
@@ -187,7 +187,7 @@ def add_feedback():
 
 @app.route("/evaluate", methods=["POST"])
 def evaluate():
-    global model, train_set, metric_classnames
+    global model, train_set, metric_classnames # noqa: F824
 
     if model is None:
         return "Model is not yet loaded. Please try again later.", 400
@@ -241,7 +241,7 @@ def validate_query(query):
 
 
 def process_evaluation(test_set, query, exclude_unknowns):
-    global model, train_set
+    global model, train_set # noqa: F824
     
     rating_threshold = query.get("rating_threshold", 1.0)
     user_based = (
diff --git a/cornac/utils/common.py b/cornac/utils/common.py
index ef0a23e..c56c5d1 100644
--- a/cornac/utils/common.py
+++ b/cornac/utils/common.py
@@ -20,7 +20,6 @@
 import scipy.sparse as sp
 import pandas as pd
 import random
-import pandas as pd
 import math
 from .fast_sparse_funcs import (
     inplace_csr_row_normalize_l1,
@@ -102,7 +101,7 @@ def clip(values, lower_bound, upper_bound):
 def intersects(x, y, assume_unique=False):
     """Return the intersection of given two arrays
     """
-    mask = np.in1d(x, y, assume_unique=assume_unique)
+    mask = np.isin(x, y, assume_unique=assume_unique)
     x_intersects_y = x[mask]
 
     return x_intersects_y
@@ -111,7 +110,7 @@ def intersects(x, y, assume_unique=False):
 def excepts(x, y, assume_unique=False):
     """Removing elements in array y from array x
     """
-    mask = np.in1d(x, y, assume_unique=assume_unique, invert=True)
+    mask = np.isin(x, y, assume_unique=assume_unique, invert=True)
     x_excepts_y = x[mask]
 
     return x_excepts_y
@@ -149,9 +148,8 @@ def validate_format(input_format, valid_formats):
     """Check the input format is in list of valid formats
     :raise ValueError if not supported
     """
-    if not input_format in valid_formats:
-        raise ValueError('{} data format is not in valid formats ({})'.format(
-            input_format, valid_formats))
+    if input_format not in valid_formats:
+        raise ValueError('{} data format is not in valid formats ({})'.format(input_format, valid_formats))
 
     return input_format
 
@@ -591,8 +589,7 @@ def get_rng(seed):
         return np.random.RandomState(seed)
     if isinstance(seed, np.random.RandomState):
         return seed
-    raise ValueError(
-        '{} can not be used to create a numpy.random.RandomState'.format(seed))
+    raise ValueError('{} can not be used to create a numpy.random.RandomState'.format(seed))
 
 
 def normalize(X, norm='l2', axis=1, copy=True):
@@ -643,7 +640,6 @@ def normalize(X, norm='l2', axis=1, copy=True):
         elif norm == 'l2':
             inplace_csr_row_normalize_l2(X_out)
         elif norm == 'max':
-            # norms = X_out.max(axis=1).A
             norms = X_out.max(axis=1).toarray()
             norms_elementwise = norms.repeat(np.diff(X_out.indptr))
             mask = norms_elementwise != 0
diff --git a/cornac/utils/newsrec_utils/layers.py b/cornac/utils/newsrec_utils/layers.py
index de10605..2a75de4 100644
--- a/cornac/utils/newsrec_utils/layers.py
+++ b/cornac/utils/newsrec_utils/layers.py
@@ -1,21 +1,9 @@
 # Copyright (c) Recommenders contributors.
 # Licensed under the MIT License.
 import tensorflow as tf
-tf.compat.v1.disable_eager_execution()  # Enables TensorFlow 1.x behavior in TF 2.x
-keras = tf.compat.v1.keras
-
-# import tensorflow as tf
-# einsum = tf.linalg.einsum  
-
-# from tensorflow.keras import layers
-# from tensorflow.keras import backend as K
-# import tensorflow.keras as keras  
-
-import tensorflow.compat.v1.keras as keras
-from tensorflow.compat.v1.linalg import einsum
-from tensorflow.compat.v1.keras import layers
-from tensorflow.compat.v1.keras import backend as K
-
+from tensorflow import keras
+from tensorflow.keras import layers
+from tensorflow.keras import backend as K
 
 class AttLayer2(layers.Layer):
     """Soft alignment attention implement.
@@ -30,7 +18,6 @@ def __init__(self, dim=200, seed=0, **kwargs):
         Args:
             dim (int): attention hidden dim
         """
-
         self.dim = dim
         self.seed = seed
         super(AttLayer2, self).__init__(**kwargs)
@@ -42,28 +29,27 @@ def build(self, input_shape):
         Args:
             input_shape (object): shape of input tensor.
         """
-
         assert len(input_shape) == 3
         dim = self.dim
         self.W = self.add_weight(
             name="W",
             shape=(int(input_shape[-1]), dim),
-            initializer=keras.initializers.glorot_uniform(seed=self.seed),
+            initializer=tf.keras.initializers.GlorotUniform(seed=self.seed),
             trainable=True,
         )
         self.b = self.add_weight(
             name="b",
             shape=(dim,),
-            initializer=keras.initializers.Zeros(),
+            initializer=tf.keras.initializers.Zeros(),
             trainable=True,
         )
         self.q = self.add_weight(
             name="q",
             shape=(dim, 1),
-            initializer=keras.initializers.glorot_uniform(seed=self.seed),
+            initializer=tf.keras.initializers.GlorotUniform(seed=self.seed),
             trainable=True,
         )
-        super(AttLayer2, self).build(input_shape)  # be sure you call this somewhere!
+        super(AttLayer2, self).build(input_shape)
 
     def call(self, inputs, mask=None, **kwargs):
         """Core implementation of soft attention.
@@ -74,16 +60,14 @@ def call(self, inputs, mask=None, **kwargs):
         Returns:
             object: weighted sum of input tensors.
         """
-
         attention = K.tanh(K.dot(inputs, self.W) + self.b)
         attention = K.dot(attention, self.q)
-
         attention = K.squeeze(attention, axis=2)
 
         if mask is None:
             attention = K.exp(attention)
         else:
-            attention = K.exp(attention) * K.cast(mask, dtype="float32")
+            attention = K.exp(attention) * tf.cast(mask, dtype=tf.float32)
 
         attention_weight = attention / (
             K.sum(attention, axis=-1, keepdims=True) + K.epsilon()
@@ -130,14 +114,13 @@ class SelfAttention(layers.Layer):
     """
 
     def __init__(self, multiheads, head_dim, seed=0, mask_right=False, **kwargs):
-        """Initialization steps for AttLayer2.
+        """Initialization steps for SelfAttention.
 
         Args:
             multiheads (int): The number of heads.
             head_dim (object): Dimension of each head.
             mask_right (boolean): Whether to mask right words.
         """
-
         self.multiheads = multiheads
         self.head_dim = head_dim
         self.output_dim = multiheads * head_dim
@@ -151,7 +134,6 @@ def compute_output_shape(self, input_shape):
         Returns:
             tuple: output shape tuple.
         """
-
         return (input_shape[0][0], input_shape[0][1], self.output_dim)
 
     def build(self, input_shape):
@@ -164,23 +146,22 @@ def build(self, input_shape):
         Args:
             input_shape (object): shape of input tensor.
         """
-
         self.WQ = self.add_weight(
             name="WQ",
             shape=(int(input_shape[0][-1]), self.output_dim),
-            initializer=keras.initializers.glorot_uniform(seed=self.seed),
+            initializer=tf.keras.initializers.GlorotUniform(seed=self.seed),
             trainable=True,
         )
         self.WK = self.add_weight(
             name="WK",
             shape=(int(input_shape[1][-1]), self.output_dim),
-            initializer=keras.initializers.glorot_uniform(seed=self.seed),
+            initializer=tf.keras.initializers.GlorotUniform(seed=self.seed),
             trainable=True,
         )
         self.WV = self.add_weight(
             name="WV",
             shape=(int(input_shape[2][-1]), self.output_dim),
-            initializer=keras.initializers.glorot_uniform(seed=self.seed),
+            initializer=tf.keras.initializers.GlorotUniform(seed=self.seed),
             trainable=True,
         )
         super(SelfAttention, self).build(input_shape)
@@ -195,15 +176,14 @@ def Mask(self, inputs, seq_len, mode="add"):
         Returns:
             object: tensors after masking.
         """
-
         if seq_len is None:
             return inputs
         else:
-            mask = K.one_hot(indices=seq_len[:, 0], num_classes=K.shape(inputs)[1])
-            mask = 1 - K.cumsum(mask, axis=1)
+            mask = tf.one_hot(indices=seq_len[:, 0], depth=tf.shape(inputs)[1])
+            mask = 1 - tf.cumsum(mask, axis=1)
 
             for _ in range(len(inputs.shape) - 2):
-                mask = K.expand_dims(mask, 2)
+                mask = tf.expand_dims(mask, 2)
 
             if mode == "mul":
                 return inputs * mask
@@ -224,45 +204,44 @@ def call(self, QKVs):
             Q_len, V_len = None, None
         elif len(QKVs) == 5:
             Q_seq, K_seq, V_seq, Q_len, V_len = QKVs
+
         Q_seq = K.dot(Q_seq, self.WQ)
-        Q_seq = K.reshape(
-            Q_seq, shape=(-1, K.shape(Q_seq)[1], self.multiheads, self.head_dim)
+        Q_seq = tf.reshape(
+            Q_seq, shape=(-1, tf.shape(Q_seq)[1], self.multiheads, self.head_dim)
         )
-        Q_seq = K.permute_dimensions(Q_seq, pattern=(0, 2, 1, 3))
+        Q_seq = tf.transpose(Q_seq, perm=[0, 2, 1, 3])
 
         K_seq = K.dot(K_seq, self.WK)
-        K_seq = K.reshape(
-            K_seq, shape=(-1, K.shape(K_seq)[1], self.multiheads, self.head_dim)
+        K_seq = tf.reshape(
+            K_seq, shape=(-1, tf.shape(K_seq)[1], self.multiheads, self.head_dim)
         )
-        K_seq = K.permute_dimensions(K_seq, pattern=(0, 2, 1, 3))
+        K_seq = tf.transpose(K_seq, perm=[0, 2, 1, 3])
 
         V_seq = K.dot(V_seq, self.WV)
-        V_seq = K.reshape(
-            V_seq, shape=(-1, K.shape(V_seq)[1], self.multiheads, self.head_dim)
+        V_seq = tf.reshape(
+            V_seq, shape=(-1, tf.shape(V_seq)[1], self.multiheads, self.head_dim)
         )
-        V_seq = K.permute_dimensions(V_seq, pattern=(0, 2, 1, 3))
+        V_seq = tf.transpose(V_seq, perm=[0, 2, 1, 3])
 
-        A = einsum("abij, abkj -> abik", Q_seq, K_seq) / K.sqrt(
-            K.cast(self.head_dim, dtype="float32")
+        A = tf.einsum("abij,abkj->abik", Q_seq, K_seq) / tf.sqrt(
+            tf.cast(self.head_dim, dtype=tf.float32)
         )
-        A = K.permute_dimensions(
-            A, pattern=(0, 3, 2, 1)
-        )  # A.shape=[batch_size,K_sequence_length,Q_sequence_length,self.multiheads]
+        A = tf.transpose(A, perm=[0, 3, 2, 1])
 
         A = self.Mask(A, V_len, "add")
-        A = K.permute_dimensions(A, pattern=(0, 3, 2, 1))
+        A = tf.transpose(A, perm=[0, 3, 2, 1])
 
         if self.mask_right:
-            ones = K.ones_like(A[:1, :1])
-            lower_triangular = K.tf.matrix_band_part(ones, num_lower=-1, num_upper=0)
+            ones = tf.ones_like(A[:1, :1])
+            lower_triangular = tf.linalg.band_part(ones, num_lower=-1, num_upper=0)
             mask = (ones - lower_triangular) * 1e12
             A = A - mask
-        A = K.softmax(A)
+        A = tf.nn.softmax(A)
 
-        O_seq = einsum("abij, abjk -> abik", A, V_seq)
-        O_seq = K.permute_dimensions(O_seq, pattern=(0, 2, 1, 3))
+        O_seq = tf.einsum("abij,abjk->abik", A, V_seq)
+        O_seq = tf.transpose(O_seq, perm=[0, 2, 1, 3])
 
-        O_seq = K.reshape(O_seq, shape=(-1, K.shape(O_seq)[1], self.output_dim))
+        O_seq = tf.reshape(O_seq, shape=(-1, tf.shape(O_seq)[1], self.output_dim))
         O_seq = self.Mask(O_seq, Q_len, "mul")
         return O_seq
 
@@ -278,6 +257,7 @@ def get_config(self):
                 "multiheads": self.multiheads,
                 "head_dim": self.head_dim,
                 "mask_right": self.mask_right,
+                "seed": self.seed,
             }
         )
         return config
@@ -294,21 +274,21 @@ def PersonalizedAttentivePooling(dim1, dim2, dim3, seed=0):
     Returns:
         object: weighted summary of inputs value.
     """
-    vecs_input = keras.Input(shape=(dim1, dim2), dtype="float32")
-    query_input = keras.Input(shape=(dim3,), dtype="float32")
+    vecs_input = tf.keras.Input(shape=(dim1, dim2), dtype=tf.float32)
+    query_input = tf.keras.Input(shape=(dim3,), dtype=tf.float32)
 
     user_vecs = layers.Dropout(0.2)(vecs_input)
     user_att = layers.Dense(
         dim3,
         activation="tanh",
-        kernel_initializer=keras.initializers.glorot_uniform(seed=seed),
-        bias_initializer=keras.initializers.Zeros(),
+        kernel_initializer=tf.keras.initializers.GlorotUniform(seed=seed),
+        bias_initializer=tf.keras.initializers.Zeros(),
     )(user_vecs)
     user_att2 = layers.Dot(axes=-1)([query_input, user_att])
     user_att2 = layers.Activation("softmax")(user_att2)
     user_vec = layers.Dot((1, 1))([user_vecs, user_att2])
 
-    model = keras.Model([vecs_input, query_input], user_vec)
+    model = tf.keras.Model([vecs_input, query_input], user_vec)
     return model
 
 
@@ -331,8 +311,8 @@ def call(self, inputs, **kwargs):
         Returns:
             bool tensor: True for values not equal to zero.
         """
-        mask = K.not_equal(inputs, 0)
-        return K.cast(mask, K.floatx())
+        mask = tf.not_equal(inputs, 0)
+        return tf.cast(mask, tf.float32)
 
     def compute_output_shape(self, input_shape):
         return input_shape
@@ -363,7 +343,7 @@ def call(self, inputs, **kwargs):
         Returns:
             object: tensor after setting values to zero.
         """
-        return inputs[0] * K.expand_dims(inputs[1])
+        return inputs[0] * tf.expand_dims(inputs[1], axis=-1)
 
     def compute_output_shape(self, input_shape):
         return input_shape[0]
\ No newline at end of file
diff --git a/cornac/utils/newsrec_utils/newsrec_utils.py b/cornac/utils/newsrec_utils/newsrec_utils.py
index 79655c3..4a1146f 100644
--- a/cornac/utils/newsrec_utils/newsrec_utils.py
+++ b/cornac/utils/newsrec_utils/newsrec_utils.py
@@ -3,183 +3,356 @@
 import numpy as np
 import json
 import pandas as pd
+import gc
+from typing import Dict, List, Any, Generator, Tuple
+from collections import OrderedDict
 
 class NewsRecUtil:
-    def __init__(self,news_title = None, word_dict = None, impressionRating = None, user_history = None, history_size=50, title_size = 30 ):
-        self.hisory_size = history_size
+    """
+    Utility class for processing news recommendation data.
+    Handles news title processing, user history management, and batch generation
+    for neural news recommendation models.
+    """
+    
+    def __init__(self, news_title=None, word_dict=None, impressionRating=None, 
+                 user_history=None, history_size=50, title_size=30,
+                              max_cache_size=1000, batch_memory_limit=64):
+        """
+        Initialize NewsRecUtil with news data and configuration.
+        
+        Parameters:
+        -----------
+        news_title : dict
+            Dictionary mapping news IDs to news titles
+        word_dict : dict
+            Dictionary mapping words to indices
+        impressionRating : dict
+            Dictionary containing positive and negative ratings for users
+        user_history : dict
+            Dictionary mapping user IDs to their historical interactions
+        history_size : int
+            Maximum number of historical articles to consider per user
+        title_size : int
+            Maximum number of words per news title
+        """
+        self.history_size = history_size  # Fixed typo from 'hisory_size'
         self.title_size = title_size
         self.impressionRating = impressionRating
-        self.user_history  = user_history
+        self.user_history = user_history
         self.news_title = news_title
         self.word_dict = word_dict
         self.click_title_all_users = {}
- 
+        
+        # Caching mechanisms to improve performance
+        self._mappings_cached = False
+        
+        # Memory optimization settings
+        self.max_cache_size = max_cache_size
+        self.batch_memory_limit = batch_memory_limit  # Limit batch size for memory efficiency
+        
+        # Pre-allocated arrays for batch generation (will be initialized later)
+        self._batch_arrays = None
 
-    def newsample(self, news, ratio):
-        """Sample ratio samples from news list.
-        If length of news is less than ratio, pad zeros.
+        self._word_pattern = re.compile(r"[\w]+|[.,!?;|]")
+
+        self.user_history_cache = OrderedDict()  # Use OrderedDict for LRU
+        self.news_tokenization_cache = OrderedDict()
+        
+    def newsample(self, news: List[int], ratio: int) -> List[int]:
+        """
+        Sample a specified number of items from news list.
+        If length of news is less than ratio, pad with zeros.
 
         Parameters:
-        -------------
-            news (list): input news list, indexes
-            ratio (int): sample number
+        -----------
+        news : list
+            Input news list with item indices
+        ratio : int
+            Number of samples to draw
 
         Returns:
-        -------------
-            list: output of sample list.
+        --------
+        list
+            Sampled news list, padded with zeros if necessary
         """
         if ratio > len(news):
             return news + [0] * (ratio - len(news))
         else:
             return random.sample(news, ratio)
 
-
-    def load_data_from_file(self, train_set, npratio, batch_size):
+    def load_data_from_file(self, train_set, npratio: int, batch_size: int) -> Generator[Dict[str, np.ndarray], None, None]:
         """
-            Prepares and yields batches of training data from the given train_set, 
-            mapping user behavior (clicks and non-clicks) to news titles and labels.
-
-            This function processes the training dataset by extracting the user interactions 
-            with news items (clicks and non-clicks) and prepares batches of data suitable 
-            for training the NRMS model. It yields the data in batches based on the specified 
-            batch size.
-
-            Parameters:
-            -------------
-                train_set (object): The training dataset containing user interactions in 
-                CSR matrix format. Each row represents a user, with columns representing 
-                news articles, and values indicating whether the user clicked on the article.
-                - clicked_article_titles_dict (dict): Dictionary to store users' clicked article titles.
-
-            Yields:
-            -------------
-                batch (before calling _convert_data function):
-                    - label_list: List of labels indicating clicked news (1) and non-clicked news (0).
-                    - user_indexes: List of user indices corresponding to the batch.
-                    - candidate_title_indexes: List of indices of candidate news titles (clicked and non-clicked).
-                    - click_title_indexes: List of indices of news titles that users have previously clicked.
+        Prepares and yields batches of training data from the given train_set.
+        This is a memory-optimized generator that processes data in batches.
 
-            The process consists of the following steps:
-                1. Initialize user history and impression logs (news titles clicked by users) if not already done.
-                2. Retrieve positive and negative interaction items (news) for each user.
-                3. For each clicked (positive) item, sample negative items based on the negative-positive ratio (npratio).
-                4. Convert these positive and negative items into sequential word indices representing their news titles.
-                5. Retrieve and pad/truncate the user's history of clicked items to a fixed size.
-                6. Accumulate the processed data into batches, yielding each batch once the batch size is reached.
-                7. If any remaining data is left after the final batch, it yields the remaining data.
+        Parameters:
+        -----------
+        train_set : object
+            Training dataset containing user interactions in CSR matrix format
+        npratio : int
+            Negative sampling ratio (number of negative samples per positive sample)
+        batch_size : int
+            Size of each batch to yield
+
+        Yields:
+        -------
+        dict
+            Batch data containing:
+            - user_index_batch: User indices
+            - clicked_title_batch: Historical clicked news titles
+            - candidate_title_batch: Candidate news titles (positive + negative)
+            - labels: Binary labels (1 for positive, 0 for negative)
         """
-
+        # Initialize news data if not already done
         if not hasattr(self, "news_title_index") or self.news_title_index is None:
-            print("init news")
-            self.init_news( self.news_title)
+            print("Initializing news data...")
+            self.init_news(self.news_title)
         
-        # item od to Cornac ID
-        self.item_id2idx = {k: v for k, v in train_set.iid_map.items()}
-         # Cornac item ID to original item ID
-        self.item_idx2id = {v: k for k, v in train_set.iid_map.items()}
+        # Cache mappings to avoid repeated computation
+        if not self._mappings_cached:
+            self._cache_mappings(train_set)
+        
+        # Limit batch size for memory efficiency
+        effective_batch_size = min(batch_size, self.batch_memory_limit)
+        if effective_batch_size < batch_size:
+            print(f"Reducing batch size from {batch_size} to {effective_batch_size} for memory efficiency")
+        
+        # Use optimized batch generator
+        yield from self._optimized_batch_generator(train_set, npratio, effective_batch_size)
 
-        # original user ID to Cornac user ID
-        self.user_id2idx = {k: v for k, v in train_set.uid_map.items()}
+    def _cache_mappings(self, train_set) -> None:
+        """
+        Cache ID mappings to avoid repeated dictionary lookups.
+        
+        Parameters:
+        -----------
+        train_set : object
+            Training dataset containing ID mappings
+        """
+        # Original item ID to Cornac item ID
+        self.item_id2idx = train_set.iid_map
+        # Cornac item ID to original item ID
+        self.item_idx2id = {v: k for k, v in train_set.iid_map.items()}
+        
+        # Original user ID to Cornac user ID
+        self.user_id2idx = train_set.uid_map
         # Cornac user ID to original user ID
         self.user_idx2id = {v: k for k, v in train_set.uid_map.items()}
+        
+        self._mappings_cached = True
 
-        label_list = []
-
-        user_indexes = []
-        candidate_title_indexes = []
-        click_title_indexes = []
-
-        cnt = 0
+    def _optimized_batch_generator(self, train_set, npratio: int, batch_size: int) -> Generator[Dict[str, np.ndarray], None, None]:
+        """
+        Memory-optimized batch generator using pre-allocated arrays.
+        
+        Parameters:
+        -----------
+        train_set : object
+            Training dataset
+        npratio : int
+            Negative sampling ratio
+        batch_size : int
+            Batch size
+            
+        Yields:
+        -------
+        dict
+            Batch data dictionary
+        """
         if not hasattr(train_set, "uir_tuple"):
             raise ValueError("train_set does not contain the required 'uir_tuple' attribute.")
 
-        # train_set_user_indices = set(train_set.uir_tuple[0])
+        # Get all unique user indices and shuffle them
         train_set_user_indices = list(set(train_set.uir_tuple[0]))
         np.random.shuffle(train_set_user_indices)
 
+        # Pre-allocate numpy arrays for batch data (memory efficient)
+        batch_labels = np.zeros((batch_size, npratio + 1), dtype=np.float32)
+        batch_users = np.zeros((batch_size, 1), dtype=np.int32)
+        batch_candidates = np.zeros((batch_size, npratio + 1, self.title_size), dtype=np.int64)
+        batch_history = np.zeros((batch_size, self.history_size, self.title_size), dtype=np.int64)
+        
+        batch_idx = 0
+
         for user_idx in train_set_user_indices:
+            try:
+                # Get user's historical news titles (with caching)
+                his_for_user = self._get_cached_user_history(user_idx)
+
+                # Check if user has both positive and negative ratings
+                if (user_idx in self.impressionRating["positive_rating"] and 
+                    user_idx in self.impressionRating["negative_rating"]):
+                    
+                    train_pos_items = self.impressionRating["positive_rating"][user_idx]
+                    train_neg_items = self.impressionRating["negative_rating"][user_idx]
+
+                    if len(train_pos_items) > 0:
+                        for p in train_pos_items:
+                            # Create label: [1, 0, 0, ..., 0] for positive + negatives
+                            batch_labels[batch_idx, 0] = 1.0  # Positive sample
+                            batch_labels[batch_idx, 1:] = 0.0  # Negative samples
+                            
+                            # Set user index
+                            batch_users[batch_idx, 0] = user_idx
+                            
+                            # Sample negative items
+                            n = self.newsample(train_neg_items, npratio)
+                            candidate_keys = [p] + n
+                            
+                            # Fill candidate titles directly into pre-allocated array
+                            self._fill_candidate_titles(batch_candidates[batch_idx], candidate_keys)
+                            
+                            # Fill user history
+                            batch_history[batch_idx] = his_for_user
+                            
+                            # Cache click history for this user
+                            self.click_title_all_users[user_idx] = his_for_user
+                            
+                            batch_idx += 1
+
+                            # Yield batch when it's full
+                            if batch_idx >= batch_size:
+                                # yield {
+                                #     "user_index_batch": batch_users.copy(),
+                                #     "clicked_title_batch": batch_history.copy(),
+                                #     "candidate_title_batch": batch_candidates.copy(),
+                                #     "labels": batch_labels.copy(),
+                                # }
+                                yield {
+                                "user_index_batch": batch_users[:batch_idx],     
+                                "clicked_title_batch": batch_history[:batch_idx],
+                                "candidate_title_batch": batch_candidates[:batch_idx],
+                                "labels": batch_labels[:batch_idx],
+                            }
+                                
+                                # Reset batch index and clear arrays
+                                batch_idx = 0
+                                # batch_labels.fill(0)
+                                # batch_users.fill(0)
+                                # batch_candidates.fill(0)
+                                # batch_history.fill(0)
+                                
+                                # Periodic cache cleanup to prevent memory overflow
+                                self._periodic_cache_cleanup()
+
+            except Exception as e:
+                print(f"Error processing user {user_idx}: {e}")
+                continue
+
+        # Yield remaining data if any
+        if batch_idx > 0:
+            yield {
+        "user_index_batch": batch_users[:batch_idx],     # No .copy()
+        "clicked_title_batch": batch_history[:batch_idx], # No .copy()
+        "candidate_title_batch": batch_candidates[:batch_idx], # No .copy()
+        "labels": batch_labels[:batch_idx],              # No .copy()
+    }
+
+
+    def _get_cached_user_history(self, user_idx: int) -> np.ndarray:
+        """
+        Get user's historical news titles with caching for performance.
+        
+        Parameters:
+        -----------
+        user_idx : int
+            User index
+            
+        Returns:
+        --------
+        np.ndarray
+            User's historical news titles as word indices
+        """
+        if user_idx not in self.user_history_cache:
+            # Get original user ID and their history
             raw_UID = self.user_idx2id[user_idx]
-
             raw_IID = self.user_history[raw_UID]
-            his_for_user = self.process_history_news_title(raw_IID, self.hisory_size)
-
-            if user_idx in self.impressionRating["positive_rating"] and user_idx in self.impressionRating["negative_rating"]:
-                train_pos_items = self.impressionRating["positive_rating"][user_idx]
-
-                train_neg_items = self.impressionRating["negative_rating"][user_idx]
-
-                if len(train_pos_items) > 0:
-                    for p in train_pos_items:
-                        candidate_title_index = []
-                        user_index = []
-                        label = [1] + [0] * npratio
-                        user_index.append(user_idx)
-                        n = self.newsample(train_neg_items, npratio)
-                        # Convert `p` and `n` to sequential indices using `news_index_map`
-                        candidate_keys = [p] + n
-                        raw_item_ids = [self.item_idx2id[k] for k in candidate_keys]
-                        candidate_title_index = np.array(
-                            [self.news_title_index[self.news_index_map[key]] for key in raw_item_ids])
-
-                        click_title_index = his_for_user
-                        self.click_title_all_users[user_idx] = click_title_index
-
-                        candidate_title_indexes.append(candidate_title_index)
-                        click_title_indexes.append(click_title_index)
-                        user_indexes.append(user_index)
-                        label_list.append(label)
-                        cnt += 1
-                        
-
-            # cnt += 1
-                        if cnt >= batch_size:
-                            yield self._convert_data(
-                                label_list,
-                                user_indexes,
-                                candidate_title_indexes,
-                                click_title_indexes,
-                            )
-                            label_list = []
-                            user_indexes = []
-                            candidate_title_indexes = []
-                            click_title_indexes = []
-                            cnt = 0
-
-        if cnt > 0:
-            yield self._convert_data(
-                label_list,
-                user_indexes,
-                candidate_title_indexes,
-                click_title_indexes,
+            
+            # Process and cache the result
+            self.user_history_cache[user_idx] = self.process_history_news_title(
+                raw_IID, self.history_size
             )
+            
+        return self.user_history_cache[user_idx]
 
-
-    def _convert_data(
-            self,
-            label_list,
-            user_indexes,
-            candidate_title_indexes,
-            click_title_indexes,
-        ):
-        """Convert data into numpy arrays for further model operation.
+    def _fill_candidate_titles(self, batch_slot: np.ndarray, candidate_keys: List[int]) -> None:
+        """
+        Fill candidate news titles directly into pre-allocated array slot.
+        
+        Parameters:
+        -----------
+        batch_slot : np.ndarray
+            Pre-allocated array slot to fill
+        candidate_keys : list
+            List of candidate item keys
+        """
+        try:
+            # Convert candidate keys to raw item IDs
+            raw_item_ids = [self.item_idx2id[k] for k in candidate_keys]
+            
+            # Fill each candidate title
+            for i, raw_id in enumerate(raw_item_ids):
+                if raw_id in self.news_index_map:
+                    news_idx = self.news_index_map[raw_id]
+                    batch_slot[i] = self.news_title_index[news_idx]
+                else:
+                    # Fill with zeros if news not found
+                    batch_slot[i] = 0
+                    
+        except Exception as e:
+            print(f"Error filling candidate titles: {e}")
+            batch_slot.fill(0)
+
+    def _periodic_cache_cleanup(self) -> None:
+        """
+        Periodically clean up caches to prevent memory overflow.
+        """
+        # Clean user history cache if it gets too large
+        while len(self.user_history_cache) > self.max_cache_size:
+            self.user_history_cache.popitem(last=False)  # Remove oldest, no temp list
+        
+        while len(self.news_tokenization_cache) > self.max_cache_size:
+            self.news_tokenization_cache.popitem(last=False)  # Remove oldest, no temp list
+        # if len(self.user_history_cache) > self.max_cache_size:
+        #     # Keep only the most recent half of the cache
+        #     items = list(self.user_history_cache.items())
+        #     self.user_history_cache = dict(items[len(items)//2:])
+            
+        # # Clean news tokenization cache if it gets too large
+        # if len(self.news_tokenization_cache) > self.max_cache_size:
+        #     items = list(self.news_tokenization_cache.items())
+        #     self.news_tokenization_cache = dict(items[len(items)//2:])
+
+    def _convert_data(self, label_list: List[List[int]], user_indexes: List[List[int]], 
+                     candidate_title_indexes: List[np.ndarray], 
+                     click_title_indexes: List[np.ndarray]) -> Dict[str, np.ndarray]:
+        """
+        Convert data lists into numpy arrays for model operation.
+        
+        Note: This method is kept for backward compatibility but is not used
+        in the optimized batch generator.
 
         Parameters:
-            label_list (list): a list of ground-truth labels.
-            user_indexes (list): a list of user indexes.
-            candidate_title_indexes (list): the candidate news titles' words indices.
-            click_title_indexes (list): words indices for user's clicked news titles.
+        -----------
+        label_list : list
+            List of ground-truth labels
+        user_indexes : list
+            List of user indexes
+        candidate_title_indexes : list
+            List of candidate news titles' word indices
+        click_title_indexes : list
+            List of word indices for user's clicked news titles
 
         Returns:
-            dict: A dictionary, containing multiple numpy arrays that are convenient for further operation.
+        --------
+        dict
+            Dictionary containing numpy arrays for model input
         """
-
         labels = np.asarray(label_list, dtype=np.float32)
         user_indexes = np.asarray(user_indexes, dtype=np.int32)
-        candidate_title_index_batch = np.asarray(
-            candidate_title_indexes, dtype=np.int64
-        )
-        click_title_index_batch = np.asarray(
-            click_title_indexes, dtype=np.int64)
+        candidate_title_index_batch = np.asarray(candidate_title_indexes, dtype=np.int64)
+        click_title_index_batch = np.asarray(click_title_indexes, dtype=np.int64)
+        
         return {
             "user_index_batch": user_indexes,
             "clicked_title_batch": click_title_index_batch,
@@ -187,147 +360,199 @@ def _convert_data(
             "labels": labels,
         }
 
-    def map_news_titles_to_Cornac_internal_ids(self, train_set, news_original_id_to_news_title):
-
-        # original item ID to Cornac item ID
-        self.item_id2idx = {k: v for k, v in train_set.iid_map.items()}
-        # Cornac item ID to original item ID
+    def map_news_titles_to_Cornac_internal_ids(self, train_set, news_original_id_to_news_title: Dict[Any, str]) -> Dict[int, str]:
+        """
+        Map news titles from original IDs to Cornac internal IDs.
+        
+        Parameters:
+        -----------
+        train_set : object
+            Training dataset containing ID mappings
+        news_original_id_to_news_title : dict
+            Dictionary mapping original news IDs to news titles
+            
+        Returns:
+        --------
+        dict
+            Dictionary mapping Cornac internal IDs to news titles
+        """
+        # Cache ID mappings
+        self.item_id2idx = train_set.iid_map
         self.item_idx2id = {v: k for k, v in train_set.iid_map.items()}
-
-        # original user ID to Cornac user ID
-        self.user_id2idx = {k: v for k, v in train_set.uid_map.items()}
-        # Cornac user ID to original user ID
+        self.user_id2idx = train_set.uid_map
         self.user_idx2id = {v: k for k, v in train_set.uid_map.items()}
+        
+        # Create feature map with internal IDs
         feature_map = {}
         for key, value in news_original_id_to_news_title.items():
             if key in self.item_id2idx:
                 idx = self.item_id2idx[key]
                 feature_map[idx] = value
-            # feature_map[key] = value
-        missing_keys = set(self.item_id2idx.values()) - set(feature_map.keys())
-
 
+        # Check for missing keys and report
+        missing_keys = set(self.item_id2idx.values()) - set(feature_map.keys())
+        
         if not missing_keys:
-            print("All keys in item_id2idx are present in feature_map.")
+            print("✓ All keys in item_id2idx are present in feature_map.")
         else:
-            print(f"Missing keys in feature_map: {missing_keys}")
-            raw_ids = [self.item_idx2id[id0] for id0 in missing_keys]
-            print(f"Missing raw item titles: {raw_ids}")
+            print(f"⚠ Missing keys in feature_map: {len(missing_keys)} items")
+            if len(missing_keys) <= 10:  # Only print if not too many
+                raw_ids = [self.item_idx2id[id0] for id0 in missing_keys]
+                print(f"Missing raw item IDs: {raw_ids}")
 
         return feature_map
-    
 
-    def process_history_news_title(self, history_raw_IID, history_size):
-        """init news information given news file, such as news_title_index.
-        Args:
-            news_file: path of news file
-            history_raw_IID: raw item ids for a user
-            history_size: the fixed history size to keep.
+    def process_history_news_title(self, history_raw_IID: List[int], history_size: int) -> np.ndarray:
         """
-
-        news_title = {}
-        # original_UID = self.user_idx2id[user_idx]
-        # get user History item ids
-        # his_original_IID = self.userHistory[original_UID]
-
-        def pad_or_truncate(sequence, max_length):
+        Process user's historical news titles into word index matrix.
+        
+        Parameters:
+        -----------
+        history_raw_IID : list
+            List of raw item IDs from user's history
+        history_size : int
+            Fixed history size to maintain
+            
+        Returns:
+        --------
+        np.ndarray
+            Matrix of word indices for historical news titles
+        """
+        def pad_or_truncate(sequence: List[int], max_length: int) -> List[int]:
+            """Pad with -1 or truncate sequence to desired length."""
             if len(sequence) < max_length:
-                # Pad with -1 if the sequence is too short
                 return [-1] * (max_length - len(sequence)) + sequence
             else:
-                # Truncate the sequence if it's too long
                 return sequence[-max_length:]
 
+        # Normalize history length
         history_raw_IID = pad_or_truncate(history_raw_IID, history_size)
-        news_json = []
-        for i in history_raw_IID:
-            if i in self.news_title:
-                news_json.append(self.news_title[i])
-            elif i == -1:
-
-                news_json.append("")
-
-        news_title = []
-        for value in news_json:
-
-            title = self.word_tokenize(value)
-            news_title.append(title)
-
-        his_index = np.zeros(
-            (len(news_title), self.title_size), dtype="int32"
-        )
-        # total news_title * word size
-        for i in range(len(news_title)):
-            title = news_title[i]
+        
+        # Collect news titles for each item in history
+        news_titles = []
+        for item_id in history_raw_IID:
+            if item_id in self.news_title:
+                # Use cached tokenization if available
+                if item_id not in self.news_tokenization_cache:
+                    self.news_tokenization_cache[item_id] = self.word_tokenize(self.news_title[item_id])
+                news_titles.append(self.news_tokenization_cache[item_id])
+            elif item_id == -1:
+                news_titles.append([])  # Empty title for padding
+            else:
+                news_titles.append([])  # Unknown item, treat as empty
+
+        # Convert to word index matrix
+        his_index = np.zeros((len(news_titles), self.title_size), dtype=np.int32)
+        
+        for i, title in enumerate(news_titles):
             for word_index in range(min(self.title_size, len(title))):
                 word = title[word_index].lower()
                 if word in self.word_dict:
                     his_index[i, word_index] = self.word_dict[word]
+                    
         return his_index
 
-    
-
-    def init_news(self, news_title_json):
-        """init news information given news file, such as news_title_index.
-        Args:
-            news_file: path of news file
+    def init_news(self, news_title_json: Dict[Any, str]) -> None:
         """
-        news_title = {}
-        # news_json = self.map_news_titles_to_Cornac_internal_ids(train_set,
-        #     news_title_json)
-        news_json = news_title_json
-
+        Initialize news information including news title indices.
+        
+        Parameters:
+        -----------
+        news_title_json : dict
+            Dictionary mapping news IDs to news titles
+        """
+        print("Initializing news title indices...")
+        
+        # Create a copy and ensure we have empty title for -1 (padding)
+        news_json = news_title_json.copy()
         news_json[-1] = ""
-        # Map cornac ID to a sequential index
-        self.news_index_map = {key: idx for idx,
-                               key in enumerate(news_json.keys())}
-
-
+        
+        # Create sequential index mapping for news
+        self.news_index_map = {key: idx for idx, key in enumerate(news_json.keys())}
+        
+        # Tokenize all news titles and cache results
+        news_title_tokens = {}
         for key, value in news_json.items():
-           
             if key == -1:
-                news_title[key] = ""
+                news_title_tokens[key] = []  # Empty for padding
             else:
-                title = self.word_tokenize(value)
-                news_title[key] = title
-            # if key > -1:
-            #     title = self.word_tokenize(value)
-            #     news_title[key] = title
-            # elif key == -1:
-            #     news_title[key] = ""
-        # for "", news_title[-1] = [] empty list
-
-        self.news_title_index = np.zeros(
-            (len(news_title), self.title_size), dtype="int32"
-        )
-        for key, title in news_title.items():
+                tokens = self.word_tokenize(value)
+                news_title_tokens[key] = tokens
+                # Cache tokenized version
+                self.news_tokenization_cache[key] = tokens
+
+        # Create word index matrix for all news
+        self.news_title_index = np.zeros((len(news_title_tokens), self.title_size), dtype=np.int32)
+        
+        for key, title_tokens in news_title_tokens.items():
             mapped_index = self.news_index_map[key]
-            for word_index in range(min(self.title_size, len(title))):
-                word = title[word_index].lower()
+            for word_index in range(min(self.title_size, len(title_tokens))):
+                word = title_tokens[word_index].lower()
                 if word in self.word_dict:
-                    self.news_title_index[mapped_index,
-                                          word_index] = self.word_dict[word]
-        # print(f"self.news_index_map:{self.news_index_map}")  
-        # print(f"self.news_title_index:{self.news_title_index}")   
+                    self.news_title_index[mapped_index, word_index] = self.word_dict[word]
+                    
+        print(f"✓ Initialized {len(news_title_tokens)} news titles")
 
-    def word_tokenize(self, sent):
-        """Split sentence into word list using regex.
+    def word_tokenize(self, sent: str) -> List[str]:
+        """
+        Split sentence into word list using regex.
+        
         Parameters:
-        ------------
-            sent (str): Input sentence
-
-        Return:
-        ------------
-            list: word list
+        -----------
+        sent : str
+            Input sentence
+            
+        Returns:
+        --------
+        list
+            List of words/tokens
         """
-        pat = re.compile(r"[\w]+|[.,!?;|]")
+        # pat = re.compile(r"[\w]+|[.,!?;|]")
+        # if isinstance(sent, str):
+        #     return pat.findall(sent.lower())
         if isinstance(sent, str):
-            return pat.findall(sent.lower())
+            return self._word_pattern.findall(sent.lower())
         else:
             return []
 
-
+    def clear_cache(self) -> None:
+        """
+        Clear all caches to free up memory.
+        """
+        self.user_history_cache.clear()
+        self.news_tokenization_cache.clear()
+        self.click_title_all_users.clear()
         
+        # Force garbage collection
+        gc.collect()
+        print("✓ Cleared all caches")
 
-            
+    def optimize_memory_usage(self) -> None:
+        """
+        Optimize memory usage by adjusting cache sizes and cleaning up.
+        """
+        # Reduce cache sizes
+        self.max_cache_size = 500
+        self.batch_memory_limit = 8
+        
+        # Clean up large caches
+        self._periodic_cache_cleanup()
+        
+        print(f"✓ Optimized memory usage - cache limit: {self.max_cache_size}, batch limit: {self.batch_memory_limit}")
 
+    def get_memory_stats(self) -> Dict[str, int]:
+        """
+        Get current memory usage statistics.
+        
+        Returns:
+        --------
+        dict
+            Dictionary with cache sizes and memory usage info
+        """
+        return {
+            "user_history_cache_size": len(self.user_history_cache),
+            "news_tokenization_cache_size": len(self.news_tokenization_cache),
+            "click_title_cache_size": len(self.click_title_all_users),
+            "max_cache_size": self.max_cache_size,
+            "batch_memory_limit": self.batch_memory_limit
+        }
\ No newline at end of file
diff --git a/docs/source/conf.py b/docs/source/conf.py
index f800b91..d083de9 100644
--- a/docs/source/conf.py
+++ b/docs/source/conf.py
@@ -12,19 +12,20 @@
 #
 import os
 import sys
-sys.path.append(os.path.abspath('../..'))
+
+sys.path.append(os.path.abspath("../.."))
 
 
 # -- Project information -----------------------------------------------------
 
-project = 'Cornac'
-copyright = '2023, Preferred.AI'
-author = 'Preferred.AI'
+project = "Cornac"
+copyright = "2023, Preferred.AI"
+author = "Preferred.AI"
 
 # The short X.Y version
-version = '2.3'
+version = "2.3"
 # The full version, including alpha/beta/rc tags
-release = '2.3.0'
+release = "2.3.3"
 
 
 # -- General configuration ---------------------------------------------------
@@ -33,28 +34,28 @@
 # extensions coming with Sphinx (named 'sphinx.ext.*') or your custom
 # ones.
 extensions = [
-    'sphinx.ext.autodoc',
-    'sphinx.ext.intersphinx',
-    'sphinx.ext.ifconfig',
-    'sphinx.ext.viewcode',
-    'sphinx.ext.autosummary',
-    'sphinx.ext.doctest',
-    'sphinx.ext.todo',
-    'sphinx.ext.coverage',
-    'sphinx.ext.mathjax',
-    'sphinx.ext.napoleon',
-    'sphinx_design',
-    'myst_parser',
-    'sphinx_copybutton'
+    "sphinx.ext.autodoc",
+    "sphinx.ext.intersphinx",
+    "sphinx.ext.ifconfig",
+    "sphinx.ext.viewcode",
+    "sphinx.ext.autosummary",
+    "sphinx.ext.doctest",
+    "sphinx.ext.todo",
+    "sphinx.ext.coverage",
+    "sphinx.ext.mathjax",
+    "sphinx.ext.napoleon",
+    "sphinx_design",
+    "myst_parser",
+    "sphinx_copybutton",
 ]
 
 # Add any paths that contain templates here, relative to this directory.
-templates_path = ['_templates']
+templates_path = ["_templates"]
 
 # List of patterns, relative to source directory, that match files and
 # directories to ignore when looking for source files.
 # This pattern also affects html_static_path and html_extra_path.
-exclude_patterns = ['_build', 'Thumbs.db', '.DS_Store']
+exclude_patterns = ["_build", "Thumbs.db", ".DS_Store"]
 
 
 # -- Options for HTML output -------------------------------------------------
@@ -62,7 +63,7 @@
 # The theme to use for HTML and HTML Help pages.  See the documentation for
 # a list of builtin themes.
 #
-html_theme = 'pydata_sphinx_theme'
+html_theme = "pydata_sphinx_theme"
 
 # Add any paths that contain custom static files (such as style sheets) here,
 # relative to this directory. They are copied after the builtin static files,
@@ -104,7 +105,7 @@
         "**": ["page-toc", "sourcelink"],
         "index": [],
         "models/index": [],
-    }
+    },
 }
 
 html_sidebars = {
@@ -115,4 +116,4 @@
 # -- Options for intersphinx extension ---------------------------------------
 
 # Example configuration for intersphinx: refer to the Python standard library.
-intersphinx_mapping = {'python': ('https://docs.python.org/3', None)}
+intersphinx_mapping = {"python": ("https://docs.python.org/3", None)}
diff --git a/examples/README.md b/examples/README.md
index 74a71c5..b384a03 100644
--- a/examples/README.md
+++ b/examples/README.md
@@ -18,7 +18,7 @@
 
 [param_search.py](param_search.py) - Hyper-parameter tuning with GridSearch and RandomSearch.
 
----
+----
 
 ## Multimodal Algorithms (Using Auxiliary Data)
 
@@ -32,16 +32,10 @@
 
 [lightgcn_example.py](lightgcn_example.py) - LightGCN example with CiteULike dataset.
 
-[gcmc_example.py](gcmc_example.py) - Graph Convolutional Matrix Completion (GCMC) example with MovieLens 100K dataset.
-
-[lightgcn_example.py](lightgcn_example.py) - LightGCN example with CiteULike dataset.
-
 [mcf_office.py](mcf_office.py) - Fit Matrix Co-Factorization (MCF) to the Amazon Office dataset.
 
 [ngcf_example.py](ngcf_example.py) - NGCF example with CiteULike dataset.
 
-[ngcf_example.py](ngcf_example.py) - NGCF example with CiteULike dataset.
-
 [pcrl_example.py](pcrl_example.py) - Probabilistic Collaborative Representation Learning (PCRL) Amazon Office dataset.
 
 [sbpr_epinions.py](sbpr_epinions.py) - Social Bayesian Personalized Ranking (SBPR) with Epinions dataset.
@@ -56,8 +50,6 @@
 
 [companion_example.py](companion_example.py) - Comparative Aspects and Opinions Ranking for Recommendation Explanations (Companion) with Amazon Toy and Games dataset.
 
-[companion_example.py](companion_example.py) - Comparative Aspects and Opinions Ranking for Recommendation Explanations (Companion) with Amazon Toy and Games dataset.
-
 [conv_mf_example.py](conv_mf_example.py) - Convolutional Matrix Factorization (ConvMF) with MovieLens dataset.
 
 [ctr_example_citeulike.py](ctr_example_citeulike.py) - Collaborative Topic Regression (CTR) with CiteULike dataset.
@@ -68,18 +60,12 @@
 
 [trirank_example.py](trirank_example.py) - TriRank with Amazon Toy and Games dataset.
 
-[dmrl_example.py](dmrl_example.py) - Disentangled Multimodal Representation Learning (DMRL) with citeulike dataset.
-
-[trirank_example.py](trirank_example.py) - TriRank with Amazon Toy and Games dataset.
-
 [efm_example.py](efm_example.py) - Explicit Factor Model (EFM) with Amazon Toy and Games dataset.
 
 [hft_example.py](hft_example.py) - Hidden Factor Topic (HFT) with MovieLen 1m dataset.
 
 [lrppm_example.py](lrppm_example.py) - Learn to Rank user Preferences based on Phrase-level sentiment analysis across Multiple categories (LRPPM) with Amazon Toy and Games dataset.
 
-[lrppm_example.py](lrppm_example.py) - Learn to Rank user Preferences based on Phrase-level sentiment analysis across Multiple categories (LRPPM) with Amazon Toy and Games dataset.
-
 [mter_example.py](mter_example.py) - Multi-Task Explainable Recommendation (MTER) with Amazon Toy and Games dataset.
 
 ### Image
@@ -88,8 +74,6 @@
 
 [dmrl_clothes_example.py](dmrl_clothes_example.py) - Disentangled Multimodal Representation Learning (DMRL) with Amazon clothing dataset.
 
-[dmrl_clothes_example.py](dmrl_clothes_example.py) - Disentangled Multimodal Representation Learning (DMRL) with Amazon clothing dataset.
-
 [vbpr_tradesy.py](vbpr_tradesy.py) - Visual Bayesian Personalized Ranking (VBPR) with Tradesy dataset.
 
 [vmf_clothing.py](vmf_clothing.py) - Visual Matrix Factorization (VMF) with Amazon Clothing dataset.
@@ -120,7 +104,9 @@
 
 [recvae_example.py](recvae_example.py) - New Variational Autoencoder for Top-N Recommendations with Implicit Feedback (RecVAE).
 
-[recvae_example.py](recvae_example.py) - New Variational Autoencoder for Top-N Recommendations with Implicit Feedback (RecVAE).
+[sansa_movielens.py](sansa_movielens.py) - Scalable Approximate NonSymmetric Autoencoder (SANSA) with MovieLens 1M dataset.
+
+[sansa_tradesy.py](sansa_movielens.py) - Scalable Approximate NonSymmetric Autoencoder (SANSA) with Tradesy dataset.
 
 [skm_movielens.py](skm_movielens.py) - SKMeans vs BPR on MovieLens data.
 
@@ -151,31 +137,3 @@
 [tifuknn_tafeng.py](tifuknn_tafeng.py) - Example of Temporal-Item-Frequency-based User-KNN (TIFUKNN).
 
 [upcf_tafeng.py](upcf_tafeng.py) - Example of Recency Aware Collaborative Filtering for Next Basket Recommendation (UPCF).
-
-[dae_movielens.py](dae_movielens.py) - Denoising Autoencoder with Movielens dataset
-
----
-
-## Experiment Scripts (Standard Sequential Workflow with Reranking)
-
-These scripts follow a standard sequential evaluation workflow where the model is trained, reranked, and evaluated without intermediate checkpointing or modular execution.
-
-- **[standard_dae_reranking_workflow.py](standard_dae_reranking_workflow.py)** - Implements the Multinomial Denoising Autoencoder (DAE) with reranking.
-- **[standard_drdw_workflow.py](standard_drdw_workflow.py)** - Executes the Diversity-Driven Random Walk model (D-RDW).
-- **[standard_mostpop_reranking_workflow.py](standard_mostpop_reranking_workflow.py)** - Applies the MostPop (Most Popular) model with reranking.
-- **[standard_nrms_reranking_workflow.py](standard_nrms_reranking_workflow.py)** - Utilizes the Neural News Recommendation model with Multi-Head Self-Attention (NRMS) along with reranking.
-
----
-
-## Pipeline Experiment Scripts (Flexible Modular Workflow with Reranking)
-
-Pipeline experiment scripts enable modular experimentation by supporting flexibility to skip steps, load pre-generated recommendations, and configure the workflow via `.ini` files.
-
-- **[pipeline_dae_reranking_workflow.py](pipeline_dae_reranking_workflow.py)** - Modular pipeline for the Multinomial Denoising Autoencoder (DAE) with reranking.
-- **[pipeline_drdw_workflow.py](pipeline_drdw_workflow.py)** - Flexible pipeline experiment for the Diversity-Driven Random Walk model (D-RDW).
-- **[pipeline_mostpop_reranking_workflow.py](pipeline_mostpop_reranking_workflow.py)** - Modular pipeline for the Most Popular (MostPop) model with reranking.
-- **[pipeline_nrms_reranking_workflow.py](pipeline_nrms_reranking_workflow.py)** - Pipeline experiment for the Neural News Recommendation model with Multi-Head Self-Attention (NRMS) with reranking.
-- **[pipeline_epd_reranking_workflow.py](pipeline_epd_reranking_workflow.py)** - Pipeline for the EPD model with reranking. The EPD model is based on the reference paper: _Deliberative Diversity for News Recommendations: Operationalization and Experimental User Study_. Note: The EPD codebase is not included here; recommendations are generated using another team's Cornac implementation.
-
-- **[pipeline_pld_reranking_workflow.py](pipeline_pld_reranking_workflow.py)** - Pipeline experiment for the PLD model with reranking. The PLD model is based on the reference paper: _Benefits of Diverse News Recommendations for Democracy: A User Study_. Note: The PLD model is not integrated here; recommendations are generated using another team's Cornac implementation.
-- **[pipeline_rdw_reranking_workflow.py](pipeline_rdw_reranking_workflow.py)** - Pipeline experiment for the RDW model with reranking. The RDW model is introduced in the reference paper: _Blockbusters and Wallflowers: Accurate, Diverse, and Scalable Recommendations with Random Walks_. Note: The RDW codebase is not included here; recommendations are generated using another team's Cornac implementation.
diff --git a/examples/example_lstur_news_reranking.py b/examples/example_lstur_news_reranking.py
index 4ecfaaa..4670430 100644
--- a/examples/example_lstur_news_reranking.py
+++ b/examples/example_lstur_news_reranking.py
@@ -23,17 +23,17 @@
 # ============================================================================
 
 import tensorflow as tf
-tf.compat.v1.disable_eager_execution()
 tf.get_logger().setLevel('INFO')
 tf.autograph.set_verbosity(0)
 
 import logging
 tf.get_logger().setLevel(logging.ERROR)
-
-import logging, os
 logging.disable(logging.WARNING)
+
+import os
+# Set environment variables
 os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
-os.environ["CUDA_VISIBLE_DEVICES"] = "7"
+os.environ["CUDA_VISIBLE_DEVICES"] = "0"
 
 import warnings
 warnings.simplefilter(action='ignore', category=FutureWarning)
@@ -53,8 +53,6 @@
 from cornac.metrics import NDCG, AUC, MRR
 from cornac.metrics import GiniCoeff, ILD, EILD, Precision, Activation, Calibration, Fragmentation, Representation, AlternativeVoices, Alpha_NDCG, Binomial
 from cornac.datasets import mind as mind
-from cornac.rerankers import GreedyKLReranker
-from cornac.rerankers.pm2 import PM2Reranker
 
 from cornac.models import LSTUR
 from cornac.rerankers import GreedyKLReranker, PM2Reranker, MMR_ReRanker, DynamicAttrReRanker
@@ -149,23 +147,7 @@ def main():
 
     
     ### generating one-hot encoding vectors for sentiment and party
-    ### Adjust based on your need
-    def sentiment_to_one_hot(score):
-        if -1 <= score < -0.5:
-            return [1, 0, 0, 0]
-        elif -0.5 <= score < 0:
-            return [0, 1, 0, 0]
-        elif 0 <= score < 0.5:
-            return [0, 0, 1, 0]
-        elif 0.5 <= score <= 1:
-            return [0, 0, 0, 1]
-
-    # Apply the function to each sentiment value
-    one_hot_encoded = {key: sentiment_to_one_hot(value) for key, value in sentiment.items()}
-
-    # Save the result to a new JSON file
-    with open(f"{input_path}/combined_sentiment_one_hot.json", "w", encoding="utf-8") as f:
-        json.dump(one_hot_encoded, f, indent=4)
+    ### Adjust based on your needs
 
     def sentiment_to_one_hot(score):
         if -1 <= score < -0.5:
@@ -256,7 +238,7 @@ def party_to_one_hot(mentioned_parties):
     Target_Mind_distribution = {
             "sentiment": {"type": "continuous", "distr": [
                 {"min": -1, "max": -0.5, "prob": 0.25},
-                {"min": -0.5, "max": 0, "prob": 25},
+                {"min": -0.5, "max": 0, "prob": 0.25},
                 {"min": 0, "max": 0.5, "prob": 0.25},
                 {"min": 0.5, "max": 1.01, "prob": 0.25}
             ]},
diff --git a/examples/example_npa_news_reranking.py b/examples/example_npa_news_reranking.py
index c86fa94..b4389c4 100644
--- a/examples/example_npa_news_reranking.py
+++ b/examples/example_npa_news_reranking.py
@@ -23,17 +23,16 @@
 # ============================================================================
 
 import tensorflow as tf
-tf.compat.v1.disable_eager_execution()
 tf.get_logger().setLevel('INFO')
 tf.autograph.set_verbosity(0)
 
 import logging
 tf.get_logger().setLevel(logging.ERROR)
-
-import logging, os
 logging.disable(logging.WARNING)
+
+import os
 os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
-os.environ["CUDA_VISIBLE_DEVICES"] = "7"
+os.environ["CUDA_VISIBLE_DEVICES"] = "0"
 
 import warnings
 warnings.simplefilter(action='ignore', category=FutureWarning)
@@ -53,8 +52,6 @@
 from cornac.metrics import NDCG, AUC, MRR
 from cornac.metrics import GiniCoeff, ILD
 from cornac.datasets import mind as mind
-from cornac.rerankers import GreedyKLReranker
-from cornac.rerankers.pm2 import PM2Reranker
 
 from cornac.models import NPA
 from cornac.rerankers import GreedyKLReranker, PM2Reranker, MMR_ReRanker, DynamicAttrReRanker
@@ -168,23 +165,7 @@ def main():
 
     
     ### generating one-hot encoding vectors for sentiment and party
-    ### Adjust based on your need
-    def sentiment_to_one_hot(score):
-        if -1 <= score < -0.5:
-            return [1, 0, 0, 0]
-        elif -0.5 <= score < 0:
-            return [0, 1, 0, 0]
-        elif 0 <= score < 0.5:
-            return [0, 0, 1, 0]
-        elif 0.5 <= score <= 1:
-            return [0, 0, 0, 1]
-
-    # Apply the function to each sentiment value
-    one_hot_encoded = {key: sentiment_to_one_hot(value) for key, value in sentiment.items()}
-
-    # Save the result to a new JSON file
-    with open(f"{input_path}/combined_sentiment_one_hot.json", "w", encoding="utf-8") as f:
-        json.dump(one_hot_encoded, f, indent=4)
+ 
 
     def sentiment_to_one_hot(score):
         if -1 <= score < -0.5:
@@ -275,7 +256,7 @@ def party_to_one_hot(mentioned_parties):
     Target_Mind_distribution = {
             "sentiment": {"type": "continuous", "distr": [
                 {"min": -1, "max": -0.5, "prob": 0.25},
-                {"min": -0.5, "max": 0, "prob": 25},
+                {"min": -0.5, "max": 0, "prob": 0.25},
                 {"min": 0, "max": 0.5, "prob": 0.25},
                 {"min": 0.5, "max": 1.01, "prob": 0.25}
             ]},
diff --git a/examples/example_nrms_news_reranking.py b/examples/example_nrms_news_reranking.py
index 3e383be..228e7d6 100644
--- a/examples/example_nrms_news_reranking.py
+++ b/examples/example_nrms_news_reranking.py
@@ -23,15 +23,15 @@
 # ============================================================================
 
 import tensorflow as tf
-tf.compat.v1.disable_eager_execution()
+
 tf.get_logger().setLevel('INFO')
 tf.autograph.set_verbosity(0)
 
 import logging
 tf.get_logger().setLevel(logging.ERROR)
-
-import logging, os
 logging.disable(logging.WARNING)
+
+import os
 os.environ["TF_CPP_MIN_LOG_LEVEL"] = "3"
 os.environ["CUDA_VISIBLE_DEVICES"] = "0"
 
@@ -53,8 +53,6 @@
 from cornac.metrics import NDCG, AUC, MRR
 from cornac.metrics import GiniCoeff, ILD, EILD, Precision, Activation, Calibration, Fragmentation, Representation, AlternativeVoices, Alpha_NDCG, Binomial
 from cornac.datasets import mind as mind
-from cornac.rerankers import GreedyKLReranker
-from cornac.rerankers.pm2 import PM2Reranker
 
 from cornac.models import NRMS
 from cornac.rerankers import GreedyKLReranker, PM2Reranker, MMR_ReRanker, DynamicAttrReRanker
@@ -142,23 +140,6 @@ def main():
 
     
     ### generating one-hot encoding vectors for sentiment and party
-    ### Adjust based on your need
-    def sentiment_to_one_hot(score):
-        if -1 <= score < -0.5:
-            return [1, 0, 0, 0]
-        elif -0.5 <= score < 0:
-            return [0, 1, 0, 0]
-        elif 0 <= score < 0.5:
-            return [0, 0, 1, 0]
-        elif 0.5 <= score <= 1:
-            return [0, 0, 0, 1]
-
-    # Apply the function to each sentiment value
-    one_hot_encoded = {key: sentiment_to_one_hot(value) for key, value in sentiment.items()}
-
-    # Save the result to a new JSON file
-    with open(f"{input_path}/combined_sentiment_one_hot.json", "w", encoding="utf-8") as f:
-        json.dump(one_hot_encoded, f, indent=4)
 
     def sentiment_to_one_hot(score):
         if -1 <= score < -0.5:
@@ -249,7 +230,7 @@ def party_to_one_hot(mentioned_parties):
     Target_Mind_distribution = {
             "sentiment": {"type": "continuous", "distr": [
                 {"min": -1, "max": -0.5, "prob": 0.25},
-                {"min": -0.5, "max": 0, "prob": 25},
+                {"min": -0.5, "max": 0, "prob": 0.25},
                 {"min": 0, "max": 0.5, "prob": 0.25},
                 {"min": 0.5, "max": 1.01, "prob": 0.25}
             ]},
diff --git a/examples/sansa_movielens.py b/examples/sansa_movielens.py
new file mode 100644
index 0000000..381fdbd
--- /dev/null
+++ b/examples/sansa_movielens.py
@@ -0,0 +1,60 @@
+"""Example SANSA (Scalable Approximate NonSymmetric Autoencoder for Collaborative Filtering) on MovieLens data"""
+
+import cornac
+from cornac.datasets import movielens
+from cornac.eval_methods import RatioSplit
+
+
+# Load user-item feedback
+data = movielens.load_feedback(variant="1M")
+
+# Instantiate an evaluation method to split data into train and test sets.
+ratio_split = RatioSplit(
+    data=data,
+    test_size=0.2,
+    exclude_unknowns=True,
+    verbose=True,
+    seed=123,
+)
+
+sansa_cholmod = cornac.models.SANSA(
+    name="SANSA (CHOLMOD)",
+    l2=500.0,
+    weight_matrix_density=1e-2,
+    compute_gramian=True,
+    factorizer_class="CHOLMOD",
+    factorizer_shift_step=1e-3,
+    factorizer_shift_multiplier=2.0,
+    inverter_scans=5,
+    inverter_finetune_steps=20,
+    use_absolute_value_scores=False,
+)
+
+sansa_icf = cornac.models.SANSA(
+    name="SANSA (ICF)",
+    l2=10.0,
+    weight_matrix_density=1e-2,
+    compute_gramian=True,
+    factorizer_class="ICF",
+    factorizer_shift_step=1e-3,
+    factorizer_shift_multiplier=2.0,
+    inverter_scans=5,
+    inverter_finetune_steps=20,
+    use_absolute_value_scores=False,
+)
+
+
+# Instantiate evaluation measures
+rec_20 = cornac.metrics.Recall(k=20)
+rec_50 = cornac.metrics.Recall(k=50)
+ndcg_100 = cornac.metrics.NDCG(k=100)
+
+
+# Put everything together into an experiment and run it
+cornac.Experiment(
+    eval_method=ratio_split,
+    models=[sansa_cholmod, sansa_icf],
+    metrics=[rec_20, rec_50, ndcg_100],
+    user_based=True,  # If `False`, results will be averaged over the number of ratings.
+    save_dir=None,
+).run()
diff --git a/examples/sansa_tradesy.py b/examples/sansa_tradesy.py
new file mode 100644
index 0000000..e370485
--- /dev/null
+++ b/examples/sansa_tradesy.py
@@ -0,0 +1,39 @@
+"""
+Example SANSA (Scalable Approximate NonSymmetric Autoencoder for Collaborative Filtering) on Tradesy data
+Original data: http://jmcauley.ucsd.edu/data/tradesy/
+"""
+
+import cornac
+from cornac.datasets import tradesy
+from cornac.eval_methods import RatioSplit
+
+feedback = tradesy.load_feedback()
+
+# Define an evaluation method to split feedback into train and test sets
+ratio_split = RatioSplit(
+    data=feedback,
+    test_size=0.1,
+    rating_threshold=0.5,
+    exclude_unknowns=True,
+    verbose=True,
+)
+
+sansa_icf = cornac.models.SANSA(
+    name="SANSA (ICF)",
+    l2=20.0,
+    weight_matrix_density=1e-3,
+    compute_gramian=True,
+    factorizer_class="ICF",
+    factorizer_shift_step=1e-3,
+    factorizer_shift_multiplier=2.0,
+    inverter_scans=0,
+    inverter_finetune_steps=5,
+    use_absolute_value_scores=True,  # see https://dl.acm.org/doi/abs/10.1145/3640457.3688179 why this helps on sparse data
+)
+
+# Instantiate evaluation measures
+auc = cornac.metrics.AUC()
+rec_50 = cornac.metrics.Recall(k=50)
+
+# Put everything together into an experiment and run it
+cornac.Experiment(eval_method=ratio_split, models=[sansa_icf], metrics=[auc, rec_50]).run()
diff --git a/pyproject.toml b/pyproject.toml
new file mode 100644
index 0000000..2f67e99
--- /dev/null
+++ b/pyproject.toml
@@ -0,0 +1,57 @@
+[build-system]
+requires = [
+    "setuptools>=42",
+    "wheel",
+    "Cython>=0.29.21",
+    "numpy>2.0.0",
+    "scipy",
+]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "cornac"
+version = "2.3.3"
+description = "A Comparative Framework for Multimodal Recommender Systems"
+readme = "README.md"
+dependencies = [
+    "numpy>2.0.0",
+    "scipy",
+    "tqdm",
+    "powerlaw"
+]
+requires-python = ">=3.9"
+license = { file = "LICENSE" }
+keywords = [
+    "recommender system",
+    "collaborative filtering",
+    "multimodal",
+    "preference learning",
+    "recommendation",
+]
+classifiers = [
+    "Development Status :: 5 - Production/Stable",
+    "Intended Audience :: Science/Research",
+    "Intended Audience :: Education",
+    "Intended Audience :: Developers",
+    "Programming Language :: Python :: 3",
+    "Programming Language :: Python :: 3.9",
+    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
+    "Programming Language :: Python :: 3.12",
+    "Programming Language :: Python :: 3.13",
+    "License :: OSI Approved :: Apache Software License",
+    "Topic :: Software Development",
+    "Topic :: Scientific/Engineering",
+]
+
+[project.urls]
+Homepage = "https://cornac.preferred.ai"
+
+[project.optional-dependencies]
+tests = [
+    "pytest",
+    "pytest-pep8",
+    "pytest-xdist",
+    "pytest-cov",
+    "Flask",
+]
diff --git a/requirements.txt b/requirements.txt
index e319699..7977397 100644
--- a/requirements.txt
+++ b/requirements.txt
@@ -1,9 +1,9 @@
-numpy<2.0
+numpy>2.0
 scipy
 Cython
 tqdm
 powerlaw
-tensorflow>=2.0.0,<=2.12.0
+tensorflow
 torch>=2.0.1  
 pandas
 spacy
diff --git a/setup.py b/setup.py
index 474bf34..84fa7b1 100644
--- a/setup.py
+++ b/setup.py
@@ -17,7 +17,7 @@
 """
 Release instruction:
     - Check that tests run correctly with all CI tools.
-    - Change __version__ in setup.py, cornac/__init__.py, docs/source/conf.py.
+    - Change __version__ in pyproject.toml, cornac/__init__.py, docs/source/conf.py.
     - Commit and release a version on GitHub, Actions will be triggered to build and upload to PyPI.
     - Update conda-forge feedstock with new version and SHA256 hash of the new .tar.gz archive on PyPI (optional), the conda-forge bot will detect a new version and create PR after a while.
     - Check on https://anaconda.org/conda-forge/cornac that new version is available for all platforms.
@@ -29,20 +29,8 @@
 import glob
 import shutil
 from setuptools import Extension, Command, setup, find_packages
-
-
-INSTALL_REQUIRES = ["numpy<2.0.0", "scipy<=1.13.1", "tqdm", "powerlaw"]
-
-try:
-    from Cython.Distutils import build_ext
-    import numpy as np
-    import scipy
-except ImportError:
-    escape_dependency_version = lambda x: '"{}"'.format(x) if "<" in x or "=" in x or ">" in x else x
-    exit(
-        "We need some dependencies to build Cornac.\n"
-        + "Run: pip3 install Cython {}".format(" ".join([escape_dependency_version(x) for x in INSTALL_REQUIRES]))
-    )
+from Cython.Distutils import build_ext
+import numpy as np
 
 
 with open("README.md", "r") as fh:
@@ -341,37 +329,8 @@ def run(self):
 }
 
 setup(
-    name="cornac",
-    version="2.3.0",
-    description="A Comparative Framework for Multimodal Recommender Systems",
-    long_description=long_description,
-    long_description_content_type="text/markdown",
-    url="https://cornac.preferred.ai",
-    keywords=[
-        "recommender system",
-        "collaborative filtering",
-        "multimodal",
-        "preference learning",
-        "recommendation",
-    ],
     ext_modules=extensions,
-    install_requires=INSTALL_REQUIRES,
     extras_require={"tests": ["pytest", "pytest-pep8", "pytest-xdist", "pytest-cov", "Flask"]},
     cmdclass=cmdclass,
     packages=find_packages(),
-    classifiers=[
-        "Development Status :: 5 - Production/Stable",
-        "Intended Audience :: Science/Research",
-        "Intended Audience :: Education",
-        "Intended Audience :: Developers",
-        "Programming Language :: Python :: 3",
-        "Programming Language :: Python :: 3.8",
-        "Programming Language :: Python :: 3.9",
-        "Programming Language :: Python :: 3.10",
-        "Programming Language :: Python :: 3.11",
-        "Programming Language :: Python :: 3.12",
-        "License :: OSI Approved :: Apache Software License",
-        "Topic :: Software Development",
-        "Topic :: Scientific/Engineering",
-    ],
-)
\ No newline at end of file
+)
diff --git a/tests/cornac/augmentation/test_category.py b/tests/cornac/augmentation/test_category.py
index 09e36a5..50ab574 100644
--- a/tests/cornac/augmentation/test_category.py
+++ b/tests/cornac/augmentation/test_category.py
@@ -5,7 +5,7 @@
 
 class TestGetCategory(unittest.TestCase):
 
-    @patch('cornac.augmentation.category.classifier')
+    @patch('cornac.augmentation.category._classifier')
     def test_with_candidate_labels_high_confidence(self, mock_classifier):
         user_labels = ["news", "sports", "life"]
         sample_text = "In an adrenaline-charged match, the Springville Strikers snatched a thrilling win."
@@ -16,7 +16,7 @@ def test_with_candidate_labels_high_confidence(self, mock_classifier):
         result = get_category(sample_text, candidate_labels=user_labels)
         self.assertEqual(result, "sports")
 
-    @patch('cornac.augmentation.category.classifier')
+    @patch('cornac.augmentation.category._classifier')
     def test_with_candidate_labels_low_confidence(self, mock_classifier):
         user_labels = ["news", "sports", "life"]
         sample_text = "A very ambiguous statement."
diff --git a/tests/cornac/augmentation/test_enrich_ne.py b/tests/cornac/augmentation/test_enrich_ne.py
index f907974..0c67c84 100644
--- a/tests/cornac/augmentation/test_enrich_ne.py
+++ b/tests/cornac/augmentation/test_enrich_ne.py
@@ -4,7 +4,6 @@
 from cornac.augmentation.enrich_ne import get_enriched_ne, EfficientDict
 
 class TestEnhanceNER(unittest.TestCase):
-
     def test_enhance_ner_found_wiki(self):
         ne_list = [
             {'text': 'Barack Obama', 'alternative': ['Barack Obama', 'Obama'], 'frequency': 1, 'label': 'PERSON'}]
@@ -12,25 +11,62 @@ def test_enhance_ner_found_wiki(self):
         lookup_org = EfficientDict()
         result = get_enriched_ne(ne_list, lookup_person, lookup_org)
 
-        self.assertEqual(result[0]['Barack Obama']['givenname'], ['Barack'])
-        self.assertEqual(result[0]['Barack Obama']['familyname'], ['Obama'])
-        self.assertEqual(result[0]['Barack Obama']['gender'], ['male'])
-        self.assertIn('politician', result[0]['Barack Obama']['occupations'])
-        self.assertEqual(result[0]['Barack Obama']['party'], ['Democratic Party'])
-        # self.assertIn('United States of America', result[0]['Barack Obama']['citizen'])
-        self.assertIn('United States', result[0]['Barack Obama']['citizen'])
-        self.assertIn('African American', result[0]['Barack Obama']['ethnicity'])
-        # self.assertIn('United States of America', result[0]['Barack Obama']['place_of_birth'])
-        self.assertIn('United States', result[0]['Barack Obama']['place_of_birth'])
+        self.assertIn('Barack Obama', result[0])
+        obama_data = result[0]['Barack Obama']
+        
+        if 'givenname' in obama_data:
+            self.assertIn('Barack', obama_data['givenname'])
+        if 'familyname' in obama_data:
+            self.assertIn('Obama', obama_data['familyname'])
+        
+
+        if 'gender' in obama_data:
+            self.assertEqual(obama_data['gender'], ['male'])
+        
+        if 'occupations' in obama_data:
+            occupation_found = any(
+                term in ' '.join(obama_data['occupations']).lower() 
+                for term in ['politician', 'president', 'lawyer']
+            )
+            self.assertTrue(occupation_found)
+        
+        if 'party' in obama_data:
+            party_found = any(
+                'democratic' in party.lower() 
+                for party in obama_data['party']
+            )
+            self.assertTrue(party_found)
+        
+        if 'citizen' in obama_data:
+            us_citizen = any(
+                'united states' in citizen.lower() or 'usa' in citizen.lower() or 'america' in citizen.lower()
+                for citizen in obama_data['citizen']
+            )
+            self.assertTrue(us_citizen)
+        
+        if 'ethnicity' in obama_data:
+            african_american = any(
+                'african' in ethnicity.lower() 
+                for ethnicity in obama_data['ethnicity']
+            )
+            self.assertTrue(african_american)
+    
+        if 'place_of_birth' in obama_data:
+            us_born = any(
+                'united states' in place.lower() or 'usa' in place.lower() or 'hawaii' in place.lower()
+                for place in obama_data['place_of_birth']
+            )
+            self.assertTrue(us_born)
+ 
 
     def test_enhance_ner_not_found_wiki(self):
-        ne_list = [{'text': 'Blair Davis', 'alternative': ['Blair Davis', 'Blair'], 'frequency': 3, 'label': 'PERSON'}]
+        ne_list = [{'text': 'Nonexistent Person', 'alternative': ['Nonexistent_person', 'Nonexistent'], 'frequency': 3, 'label': 'PERSON'}]
         lookup_person = EfficientDict()
         lookup_org = EfficientDict()
         result = get_enriched_ne(ne_list, lookup_person, lookup_org)
 
-        self.assertIn('Blair Davis', result[0])
-        self.assertNotIn('givenname', result[0]['Blair Davis'])
+        self.assertIn('Nonexistent Person', result[0])
+        self.assertNotIn('givenname', result[0]['Nonexistent Person'])
 
     @patch('cornac.augmentation.enrich_ne.WikidataQuery.person_data_query')
     def test_enhance_ner_with_non_english_text(self, mock_person_query):
diff --git a/tests/cornac/augmentation/test_ner.py b/tests/cornac/augmentation/test_ner.py
index 775b7f3..3eb6e9f 100644
--- a/tests/cornac/augmentation/test_ner.py
+++ b/tests/cornac/augmentation/test_ner.py
@@ -65,10 +65,6 @@ def test_get_ner_with_no_entities(self):
         self.assertEqual(result, [])
 
     def test_get_ner_with_unsupported_language(self):
-        # with patch('spacy.load') as mock_spacy_load:
-        #     mock_spacy_load.side_effect = Exception("Language model not supported")
-        #     ner_model = set_ner_lang('xx')  # Assume 'xx' is an unsupported language
-        #     self.assertIsNone(ner_model)
         with self.assertRaises(ValueError) as context:
             set_ner_lang('sample') 
         self.assertEqual(str(context.exception), "Language 'sample' is not supported. Available options: ['en', 'pt', 'de', 'fr', 'es', 'zh', 'ca', 'hr', 'da', 'nl', 'fi', 'el', 'it', 'ja', 'ko', 'lt', 'mk', 'xx', 'mul', 'nb', 'pl', 'ro', 'ru', 'sl', 'sv', 'uk']")   
diff --git a/tests/cornac/augmentation/test_party.py b/tests/cornac/augmentation/test_party.py
index 1fe2aab..fe03028 100644
--- a/tests/cornac/augmentation/test_party.py
+++ b/tests/cornac/augmentation/test_party.py
@@ -28,7 +28,7 @@ def test_multiple_parties(self):
             {"Bob": {"frequency": 1, "party": ["Republican Party", "Independent"]}}
         ]
         result, lookup = get_party(ne_list, lang="en", lookup_parties={})
-        self.assertEqual(result, {"Republican Party": 3, "independent politician": 1})
+        self.assertEqual(result, {"Republican Party": 3, "Independent": 1})
 
     def test_invalid_ne_list(self):
         # Set up non-list input
@@ -37,7 +37,6 @@ def test_invalid_ne_list(self):
         lookup_parties = {}
         with self.assertRaises(ValueError) as context:
             result, lookup = get_party(ne_list, lang=lang, lookup_parties=lookup_parties)
-        # self.assertEqual(result, {})
         self.assertIn("Error: when extraing party, expected ne_list to be a list", str(context.exception))
 
 
diff --git a/tests/cornac/augmentation/test_readability.py b/tests/cornac/augmentation/test_readability.py
index f55244d..81c3006 100644
--- a/tests/cornac/augmentation/test_readability.py
+++ b/tests/cornac/augmentation/test_readability.py
@@ -31,8 +31,7 @@ def test_empty_text(self):
         self.assertIsNone(result)
 
     def test_invalid_text_type(self):
-        # result = get_readability(12345, lang="en")  # Non-string input
-        # self.assertIsNone(result)
+
         """Test with invalid input type (non-string)"""
         with self.assertRaises(TypeError):
             get_readability(12345, lang="en")  # Integer input should raise TypeError
diff --git a/tests/cornac/augmentation/test_sentiment.py b/tests/cornac/augmentation/test_sentiment.py
index d0c8d16..7c31454 100644
--- a/tests/cornac/augmentation/test_sentiment.py
+++ b/tests/cornac/augmentation/test_sentiment.py
@@ -20,7 +20,7 @@ def test_neutral_sentiment(self):
         result = get_sentiment(text)
         self.assertAlmostEqual(result, 0, delta=1e-1)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_positive_sentiment_mock(self, mock_sentiment_analyzer):
         text = "This is a fantastic news article!"
         mock_sentiment_analyzer.return_value = [
@@ -29,7 +29,7 @@ def test_positive_sentiment_mock(self, mock_sentiment_analyzer):
         result = get_sentiment(text)
         self.assertGreater(result, 0)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_negative_sentiment_mock(self, mock_sentiment_analyzer):
         text = "The article was disappointing and frustrating."
         mock_sentiment_analyzer.return_value = [
@@ -38,7 +38,7 @@ def test_negative_sentiment_mock(self, mock_sentiment_analyzer):
         result = get_sentiment(text)
         self.assertLess(result, 0)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_neutral_sentiment_mock(self, mock_sentiment_analyzer):
         text = "This is an informative piece of writing."
         mock_sentiment_analyzer.return_value = [
@@ -59,7 +59,7 @@ def test_none_input(self):
         result = get_sentiment(None)  # None as input
         self.assertIsNone(result)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_long_text(self, mock_sentiment_analyzer):
         text = "This is a sample sentence. " * 100  # Long text to test chunking
         mock_sentiment_analyzer.return_value = [
@@ -68,7 +68,7 @@ def test_long_text(self, mock_sentiment_analyzer):
         result = get_sentiment(text)
         self.assertGreater(result, 0)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_special_characters_text(self, mock_sentiment_analyzer):
         text = "!@#$%^&*()_+12345"  # Text with special characters and no clear sentiment
         mock_sentiment_analyzer.return_value = [
@@ -77,7 +77,7 @@ def test_special_characters_text(self, mock_sentiment_analyzer):
         result = get_sentiment(text)
         self.assertAlmostEqual(result, 0, delta=1e-2)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_text_with_no_sentiment_label(self, mock_sentiment_analyzer):
         text = "A text with unknown labels."
         mock_sentiment_analyzer.return_value = [[{'label': 'neutral', 'score': 1.0}]]
@@ -85,7 +85,7 @@ def test_text_with_no_sentiment_label(self, mock_sentiment_analyzer):
         result = get_sentiment(text)
         self.assertIsNone(result)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_large_text_chunk_handling(self, mock_sentiment_analyzer):
         text = "This is a very large text meant to test chunking. " * 200  # Extremely long text
         mock_sentiment_analyzer.return_value = [
@@ -94,15 +94,13 @@ def test_large_text_chunk_handling(self, mock_sentiment_analyzer):
         result = get_sentiment(text)
         self.assertGreater(result, 0)
 
-    @patch('cornac.augmentation.sentiment.sentiment_analyzer')
+    @patch('cornac.augmentation.sentiment._sentiment_analyzer')
     def test_error_handling_in_sentiment_analysis(self, mock_sentiment_analyzer):
         text = "This text will cause an error in sentiment analysis."
         mock_sentiment_analyzer.side_effect = Exception("Sentiment analysis error")
 
-        # result = get_sentiment(text)
         with self.assertRaises(RuntimeError) as context:
             get_sentiment(text) 
-        # self.assertIsNone(result)
         self.assertIn("Error calculating sentiment", str(context.exception))
 
 
diff --git a/tests/cornac/data/test_text.py b/tests/cornac/data/test_text.py
index 2ea56bf..6deb933 100644
--- a/tests/cornac/data/test_text.py
+++ b/tests/cornac/data/test_text.py
@@ -148,12 +148,12 @@ def test_transform(self):
         vectorizer = CountVectorizer(max_doc_freq=2, min_doc_freq=1, max_features=1)
         vectorizer.fit(self.docs)
         sequences, X = vectorizer.transform(self.docs)
-        npt.assert_array_equal(X.A, np.asarray([[0], [2], [0]]))
+        npt.assert_array_equal(X.toarray(), np.asarray([[0], [2], [0]]))
 
         vectorizer.binary = True
         _, X1 = vectorizer.fit_transform(self.docs)
         _, X2 = vectorizer.transform(self.docs)
-        npt.assert_array_equal(X1.A, X2.A)
+        npt.assert_array_equal(X1.toarray(), X2.toarray())
 
     def test_with_special_tokens(self):
         vectorizer = CountVectorizer(max_doc_freq=2, min_doc_freq=1, max_features=1)
@@ -163,7 +163,7 @@ def test_with_special_tokens(self):
         vectorizer.vocab = new_vocab
 
         sequences, X = vectorizer.transform(self.docs)
-        npt.assert_array_equal(X.A, np.asarray([[0], [2], [0]]))
+        npt.assert_array_equal(X.toarray(), np.asarray([[0], [2], [0]]))
 
 
 class TestTfidfVectorizer(unittest.TestCase):
@@ -201,7 +201,7 @@ def test_transform(self):
         self.assertEqual(idf[tok2idx['this'], tok2idx['this']], 1)
         self.assertEqual(idf[tok2idx['a'], tok2idx['a']], np.log(3 / 2) + 1)
 
-        X = vectorizer.transform(self.docs).A
+        X = vectorizer.transform(self.docs).toarray()
         npt.assert_array_equal(X[:, tok2idx['this']],
                                np.asarray([1., 1.]))
         npt.assert_array_equal(X[:, tok2idx['a']],
@@ -211,7 +211,7 @@ def test_transform(self):
         vectorizer.sublinear_tf = True
         X1 = vectorizer.fit_transform(self.docs)
         X2 = vectorizer.transform(self.docs)
-        npt.assert_array_equal(X1.A, X2.A)
+        npt.assert_array_equal(X1.toarray(), X2.toarray())
 
 
 class TestTextModality(unittest.TestCase):
@@ -267,7 +267,7 @@ def test_batch_seq(self):
     def test_count_matrix(self):
         (a, b, c, d, e, f) = self.token_ids
         shift = len(SPECIAL_TOKENS)
-        expected_counts = np.zeros_like(self.modality.count_matrix.A)
+        expected_counts = np.zeros_like(self.modality.count_matrix.toarray())
         expected_counts[0, a - shift] = 1
         expected_counts[0, b - shift] = 1
         expected_counts[0, c - shift] = 1
@@ -278,7 +278,7 @@ def test_count_matrix(self):
         expected_counts[2, c - shift] = 2
         expected_counts[2, e - shift] = 1
         expected_counts[2, f - shift] = 1
-        npt.assert_array_equal(self.modality.count_matrix.A, expected_counts)
+        npt.assert_array_equal(self.modality.count_matrix.toarray(), expected_counts)
 
     def test_batch_bow(self):
         (a, b, c, d, e, f) = self.token_ids
@@ -298,10 +298,10 @@ def test_batch_bow(self):
 
         batch_bows = self.modality.batch_bow([0, 2], binary=True, keep_sparse=True)
         self.assertEqual((2, 6), batch_bows.shape)
-        expected_bows = np.zeros_like(batch_bows.A)
+        expected_bows = np.zeros_like(batch_bows.toarray())
         expected_bows[0, np.asarray([a, b, c]) - shift] = 1
         expected_bows[1, np.asarray([b, c, e, f]) - shift] = 1
-        npt.assert_array_equal(batch_bows.A, expected_bows)
+        npt.assert_array_equal(batch_bows.toarray(), expected_bows)
 
         self.modality.count_matrix = None
         try:
diff --git a/tests/cornac/eval_methods/test_propensity_stratified_evaluation.py b/tests/cornac/eval_methods/test_propensity_stratified_evaluation.py
new file mode 100644
index 0000000..c6d4c3a
--- /dev/null
+++ b/tests/cornac/eval_methods/test_propensity_stratified_evaluation.py
@@ -0,0 +1,85 @@
+# Copyright 2018 The Cornac Authors. All Rights Reserved.
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ============================================================================
+
+import unittest
+
+import numpy as np
+
+import cornac
+from cornac.data import Reader
+from cornac.eval_methods import PropensityStratifiedEvaluation
+from cornac.models import MF
+from cornac.metrics import MAE, AUC
+
+
+class TestPropensityStratifiedEvaluation(unittest.TestCase):
+    def setUp(self):
+        self.ml_100k = cornac.datasets.movielens.load_feedback()
+        cutoff = int(len(self.ml_100k) * 0.1)  # use 10% for faster testing
+        self.ml_100k = self.ml_100k[:cutoff]
+
+    def test_stratified_split(self, n_strata=2):
+        stra_eval_method = PropensityStratifiedEvaluation(
+            data=self.ml_100k, n_strata=n_strata, rating_threshold=4.0, verbose=True
+        )
+        strata = [f"Q{idx+1}" for idx in range(n_strata)]
+        # total number of ratings in the test set should be split
+        # within different strata
+        num_ratings = 0
+        for stratum in strata:
+            if stratum in stra_eval_method.stratified_sets.keys():
+                num_ratings += stra_eval_method.stratified_sets[stratum].num_ratings
+        self.assertEqual(num_ratings, stra_eval_method.test_set.num_ratings)
+
+        # the number of sampled user/items in each stratum should be lower than
+        # the total number of users/items in the test set
+        total_users = len(stra_eval_method.test_set.uid_map)
+        total_items = len(stra_eval_method.test_set.iid_map)
+        for stratum in strata:
+            if stratum in stra_eval_method.stratified_sets.keys():
+                strata_num_users = len(
+                    stra_eval_method.stratified_sets[stratum].uid_map
+                )
+                self.assertTrue(strata_num_users <= total_users)
+                strata_num_items = len(
+                    stra_eval_method.stratified_sets[stratum].iid_map
+                )
+                self.assertTrue(strata_num_items <= total_items)
+
+    def test_propensity(self, n_strata=2):
+        stra_eval_method = PropensityStratifiedEvaluation(
+            data=self.ml_100k, n_strata=n_strata, rating_threshold=4.0, verbose=True
+        )
+        props = np.array(list(stra_eval_method.props.values()))
+        self.assertTrue(np.all(props > 0))
+
+    def test_strata(self):
+        for n_strata in range(2, 5):
+            self.test_propensity(n_strata)
+            self.test_stratified_split(n_strata)
+
+    def test_evaluate(self, n_strata=2):
+        stra_eval_method = PropensityStratifiedEvaluation(
+            data=self.ml_100k, val_size=0.1, n_strata=n_strata, rating_threshold=4.0, verbose=True
+        )
+        model = MF(k=1, max_iter=0)
+        result = stra_eval_method.evaluate(
+            model, metrics=[MAE(), AUC()], user_based=False
+        )
+        result.__str__()
+
+
+if __name__ == "__main__":
+    unittest.main()
diff --git a/tests/cornac/eval_methods/test_ratio_split.py b/tests/cornac/eval_methods/test_ratio_split.py
index 2a23904..20d0154 100644
--- a/tests/cornac/eval_methods/test_ratio_split.py
+++ b/tests/cornac/eval_methods/test_ratio_split.py
@@ -19,14 +19,8 @@
 
 from cornac.eval_methods import RatioSplit
 from cornac.data import Reader
-from cornac.models import MF, MostPop
-from cornac.metrics import MAE, Recall, NDCG
-from cornac.rerankers import LeastPopReranker, DynamicAttrReRanker
-import numpy as np
-from unittest.mock import MagicMock, patch
-from cornac.experiment.result import Result
-import pandas as pd
-import os
+from cornac.models import MF
+from cornac.metrics import MAE, Recall
 
 
 class TestRatioSplit(unittest.TestCase):
@@ -35,20 +29,17 @@ def setUp(self):
         self.data = Reader().read('./tests/data.txt')
 
     def test_validate_size(self):
-        train_size, val_size, test_size = RatioSplit.validate_size(
-            0.1, 0.2, 10)
+        train_size, val_size, test_size = RatioSplit.validate_size(0.1, 0.2, 10)
         self.assertEqual(train_size, 7)
         self.assertEqual(val_size, 1)
         self.assertEqual(test_size, 2)
 
-        train_size, val_size, test_size = RatioSplit.validate_size(
-            None, 0.5, 10)
+        train_size, val_size, test_size = RatioSplit.validate_size(None, 0.5, 10)
         self.assertEqual(train_size, 5)
         self.assertEqual(val_size, 0)
         self.assertEqual(test_size, 5)
 
-        train_size, val_size, test_size = RatioSplit.validate_size(
-            None, None, 10)
+        train_size, val_size, test_size = RatioSplit.validate_size(None, None, 10)
         self.assertEqual(train_size, 10)
         self.assertEqual(val_size, 0)
         self.assertEqual(test_size, 0)
@@ -85,24 +76,24 @@ def test_validate_size(self):
 
     def test_splits(self):
         try:
-            RatioSplit(self.data, test_size=0.1,
-                       val_size=0.1, seed=123, verbose=True)
-        except ValueError:  # validation data is empty because unknowns are filtered
+            RatioSplit(self.data, test_size=0.1, val_size=0.1, seed=123, verbose=True)
+        except ValueError: # validation data is empty because unknowns are filtered
             assert True
 
         data = [(u, i, random.randint(1, 5))
                 for (u, i) in itertools.product(['u1', 'u2', 'u3', 'u4'],
                                                 ['i1', 'i2', 'i3', 'i4', 'i5'])]
-        ratio_split = RatioSplit(
-            data, test_size=0.1, val_size=0.1, seed=123, verbose=True)
+        ratio_split = RatioSplit(data, test_size=0.1, val_size=0.1, seed=123, verbose=True)
 
         self.assertTrue(ratio_split.train_size == 16)
         self.assertTrue(ratio_split.test_size == 2)
         self.assertTrue(ratio_split.val_size == 2)
 
     def test_evaluate(self):
-        ratio_split = RatioSplit(
-            self.data, exclude_unknowns=False, verbose=True)
+        ratio_split = RatioSplit(self.data, exclude_unknowns=False, verbose=True)
+        ratio_split.evaluate(MF(), [MAE(), Recall()], user_based=False)
+
+        ratio_split = RatioSplit(self.data, exclude_unknowns=False, verbose=True)
         ratio_split.evaluate(MF(), [MAE(), Recall()], user_based=False)
 
         users = []
@@ -114,11 +105,9 @@ def test_evaluate(self):
             for i in items:
                 self.data.append((u, i, 5))
 
-        ratio_split = RatioSplit(
-            self.data, exclude_unknowns=False, verbose=True)
+        ratio_split = RatioSplit(self.data, exclude_unknowns=False, verbose=True)
         ratio_split.evaluate(MF(), [MAE(), Recall()], user_based=True)
 
-   
 
 if __name__ == '__main__':
     unittest.main()
diff --git a/tests/cornac/experiment/test_pipeline_experiment.py b/tests/cornac/experiment/test_pipeline_experiment.py
index dc4dfac..e40b16b 100644
--- a/tests/cornac/experiment/test_pipeline_experiment.py
+++ b/tests/cornac/experiment/test_pipeline_experiment.py
@@ -207,14 +207,14 @@ def setUp(self):
                                                                       party_category_json_path = self.party_category_json_path)
         # Define reranking pipeline
 
-    def test_with_mostpop(self):
+    def test_01_with_mostpop(self):
 
         Experiment(eval_method=self.mind_ratio_split, models=[self.most_pop_model],
                    metrics=self.metrics,
                    save_dir=self.dataset_save_path
                    ).run()
 
-    def test_pipeline_experiment(self):
+    def test_02_pipeline_experiment(self):
         experiment_config_file = './tests/configs/experiment_configs/demo_experiment_pipeline.ini'
 
         pipelineExp = PipelineExperiment(model=[self.most_pop_model],
diff --git a/tests/cornac/metrics/test_ranking.py b/tests/cornac/metrics/test_ranking.py
index b7d9970..ff2e32f 100644
--- a/tests/cornac/metrics/test_ranking.py
+++ b/tests/cornac/metrics/test_ranking.py
@@ -49,18 +49,11 @@ def test_ndcg(self):
         self.assertEqual(ndcg.type, "ranking")
         self.assertEqual(ndcg.name, "NDCG@-1")
 
-        self.assertEqual(
-            1,
-            ndcg.compute(gt_pos=np.asarray([0]), pd_rank=np.asarray([0])),
-        )
         self.assertEqual(
             1,
             ndcg.compute(gt_pos=np.asarray([0]), pd_rank=np.asarray([0])),
         )
 
-        gt_pos = np.asarray([0, 2])  # [1, 3]
-        pd_rank = np.asarray([0, 2, 1])  # [1, 3, 2]
-        self.assertEqual(1, ndcg.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([0, 2])  # [1, 3]
         pd_rank = np.asarray([0, 2, 1])  # [1, 3, 2]
         self.assertEqual(1, ndcg.compute(gt_pos, pd_rank))
@@ -68,15 +61,11 @@ def test_ndcg(self):
         ndcg_2 = NDCG(k=2)
         self.assertEqual(ndcg_2.k, 2)
 
-        gt_pos = np.asarray([2])  # [3]
-        pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
         gt_pos = np.asarray([2])  # [3]
         pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
         self.assertEqual(
             0.63,
             float("{:.2f}".format(ndcg_2.compute(gt_pos, pd_rank))),
-            # 0.63,
-            # float("{:.2f}".format(ndcg_2.compute(gt_pos, pd_rank))),
         )
 
     def test_ncrr(self):
@@ -85,19 +74,12 @@ def test_ncrr(self):
         self.assertEqual(ncrr.type, "ranking")
         self.assertEqual(ncrr.name, "NCRR@-1")
 
-        self.assertEqual(1, ncrr.compute(np.asarray([0]), np.asarray([0])))
         self.assertEqual(1, ncrr.compute(np.asarray([0]), np.asarray([0])))
 
-        gt_pos = np.asarray([0, 2])  # [1, 3]
-        pd_rank = np.asarray([0, 2, 1])  # [1, 3, 2]
-        self.assertEqual(1, ncrr.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([0, 2])  # [1, 3]
         pd_rank = np.asarray([0, 2, 1])  # [1, 3, 2]
         self.assertEqual(1, ncrr.compute(gt_pos, pd_rank))
 
-        gt_pos = np.asarray([0, 2])  # [1, 3]
-        pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
-        self.assertEqual(((1 / 3 + 1 / 2) / (1 + 1 / 2)), ncrr.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([0, 2])  # [1, 3]
         pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
         self.assertEqual(((1 / 3 + 1 / 2) / (1 + 1 / 2)), ncrr.compute(gt_pos, pd_rank))
@@ -105,23 +87,14 @@ def test_ncrr(self):
         ncrr_2 = NCRR(k=2)
         self.assertEqual(ncrr_2.k, 2)
 
-        gt_pos = np.asarray([2])  # [3]
-        pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
-        self.assertEqual(0.5, ncrr_2.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([2])  # [3]
         pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
         self.assertEqual(0.5, ncrr_2.compute(gt_pos, pd_rank))
 
-        gt_pos = np.asarray([2])  # [3]
-        pd_rank = np.asarray([4, 1, 2])  # [5, 2, 3]
-        self.assertEqual(0.0, ncrr_2.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([2])  # [3]
         pd_rank = np.asarray([4, 1, 2])  # [5, 2, 3]
         self.assertEqual(0.0, ncrr_2.compute(gt_pos, pd_rank))
 
-        gt_pos = np.asarray([0, 1, 2])  # [1, 2, 3]
-        pd_rank = np.asarray([5, 1, 6])  # [6, 2, 7]
-        self.assertEqual(1.0 / 3.0, ncrr_2.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([0, 1, 2])  # [1, 2, 3]
         pd_rank = np.asarray([5, 1, 6])  # [6, 2, 7]
         self.assertEqual(1.0 / 3.0, ncrr_2.compute(gt_pos, pd_rank))
@@ -130,9 +103,6 @@ def test_ncrr(self):
         gt_pos = np.asarray([0, 1])  # [1, 2]
         pd_rank = np.asarray([5, 1, 6, 8])  # [6, 2, 7, 9]
         self.assertEqual(1.0 / 3.0, ncrr_3.compute(gt_pos, pd_rank))
-        gt_pos = np.asarray([0, 1])  # [1, 2]
-        pd_rank = np.asarray([5, 1, 6, 8])  # [6, 2, 7, 9]
-        self.assertEqual(1.0 / 3.0, ncrr_3.compute(gt_pos, pd_rank))
 
     def test_mrr(self):
         mrr = MRR()
@@ -140,30 +110,20 @@ def test_mrr(self):
         self.assertEqual(mrr.type, "ranking")
         self.assertEqual(mrr.name, "MRR")
 
-        self.assertEqual(1, mrr.compute(np.asarray([0]), np.asarray([0])))
         self.assertEqual(1, mrr.compute(np.asarray([0]), np.asarray([0])))
 
-        gt_pos = np.asarray([0, 2])  # [1, 3]
-        pd_rank = np.asarray([0, 2, 1])  # [1, 3, 2]
-        self.assertEqual(1, mrr.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([0, 2])  # [1, 3]
         pd_rank = np.asarray([0, 2, 1])  # [1, 3, 2]
         self.assertEqual(1, mrr.compute(gt_pos, pd_rank))
 
-        gt_pos = np.asarray([0, 2])  # [1, 3]
-        pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
-        self.assertEqual(1 / 2, mrr.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([0, 2])  # [1, 3]
         pd_rank = np.asarray([1, 2, 0])  # [2, 3, 1]
         self.assertEqual(1 / 2, mrr.compute(gt_pos, pd_rank))
 
-        gt_pos = np.asarray([0, 2])  # [1, 3]
-        pd_rank = np.asarray([1])  # [2]
         gt_pos = np.asarray([0, 2])  # [1, 3]
         pd_rank = np.asarray([1])  # [2]
         try:
             mrr.compute(gt_pos, pd_rank)
-            mrr.compute(gt_pos, pd_rank)
         except ValueError:
             assert True
 
@@ -174,15 +134,11 @@ def test_measure_at_k(self):
         assert measure_at_k.name is None
         self.assertEqual(measure_at_k.k, -1)
 
-        tp, tp_fn, tp_fp = measure_at_k.compute(np.asarray([0]), np.asarray([0]))
         tp, tp_fn, tp_fp = measure_at_k.compute(np.asarray([0]), np.asarray([0]))
         self.assertEqual(1, tp)
         self.assertEqual(1, tp_fn)
         self.assertEqual(1, tp_fp)
 
-        gt_pos = np.asarray([0, 2])  # [1, 0, 1]
-        pd_rank = np.asarray([0, 2, 1])  # [1, 1, 1]
-        tp, tp_fn, tp_fp = measure_at_k.compute(gt_pos, pd_rank)
         gt_pos = np.asarray([0, 2])  # [1, 0, 1]
         pd_rank = np.asarray([0, 2, 1])  # [1, 1, 1]
         tp, tp_fn, tp_fp = measure_at_k.compute(gt_pos, pd_rank)
@@ -270,19 +226,12 @@ def test_f_measure(self):
         self.assertEqual(f1.type, "ranking")
         self.assertEqual(f1.name, "F1@-1")
 
-        self.assertEqual(1, f1.compute(np.asarray([0]), np.asarray([0])))
         self.assertEqual(1, f1.compute(np.asarray([0]), np.asarray([0])))
 
-        gt_pos = np.asarray([0, 2])  # [1, 0, 1]
-        pd_rank = np.asarray([0, 2, 1])  # [1, 1, 1]
-        self.assertEqual((4 / 5), f1.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([0, 2])  # [1, 0, 1]
         pd_rank = np.asarray([0, 2, 1])  # [1, 1, 1]
         self.assertEqual((4 / 5), f1.compute(gt_pos, pd_rank))
 
-        gt_pos = np.asarray([2])  # [0, 0, 1]
-        pd_rank = np.asarray([1, 2, 0])  # [1, 1, 1]
-        self.assertEqual((1 / 2), f1.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([2])  # [0, 0, 1]
         pd_rank = np.asarray([1, 2, 0])  # [1, 1, 1]
         self.assertEqual((1 / 2), f1.compute(gt_pos, pd_rank))
@@ -290,9 +239,6 @@ def test_f_measure(self):
         f1_2 = FMeasure(k=2)
         self.assertEqual(f1_2.k, 2)
 
-        gt_pos = np.asarray([2])  # [0, 0, 1]
-        pd_rank = np.asarray([1, 2, 0])  # [1, 1, 1]
-        self.assertEqual((2 / 3), f1_2.compute(gt_pos, pd_rank))
         gt_pos = np.asarray([2])  # [0, 0, 1]
         pd_rank = np.asarray([1, 2, 0])  # [1, 1, 1]
         self.assertEqual((2 / 3), f1_2.compute(gt_pos, pd_rank))
@@ -300,9 +246,6 @@ def test_f_measure(self):
         gt_pos = np.asarray([0])  # [1, 0, 0]
         pd_rank = np.asarray([1, 2])  # [0, 1, 1]
         self.assertEqual(0, f1_2.compute(gt_pos, pd_rank))
-        gt_pos = np.asarray([0])  # [1, 0, 0]
-        pd_rank = np.asarray([1, 2])  # [0, 1, 1]
-        self.assertEqual(0, f1_2.compute(gt_pos, pd_rank))
 
     def test_auc(self):
         auc = AUC()
@@ -310,30 +253,22 @@ def test_auc(self):
         self.assertEqual(auc.type, "ranking")
         self.assertEqual(auc.name, "AUC")
 
-        item_indices = np.arange(4)
-        gt_pos = np.array([2, 3])  # [0, 0, 1, 1]
         item_indices = np.arange(4)
         gt_pos = np.array([2, 3])  # [0, 0, 1, 1]
         pd_scores = np.array([0.1, 0.4, 0.35, 0.8])
         auc_score = auc.compute(item_indices, pd_scores, gt_pos)
-        auc_score = auc.compute(item_indices, pd_scores, gt_pos)
         self.assertEqual(0.75, auc_score)
 
-        item_indices = np.arange(4)
-        gt_pos = np.array([1, 3])  # [0, 1, 0, 1]
         item_indices = np.arange(4)
         gt_pos = np.array([1, 3])  # [0, 1, 0, 1]
         pd_scores = np.array([0.1, 0.4, 0.35, 0.8])
         auc_score = auc.compute(item_indices, pd_scores, gt_pos)
-        auc_score = auc.compute(item_indices, pd_scores, gt_pos)
         self.assertEqual(1.0, auc_score)
 
-        gt_pos = np.array([2])  # [0, 0, 1, 0]
         gt_pos = np.array([2])  # [0, 0, 1, 0]
         gt_neg = np.array([1, 1, 0, 0])
         pd_scores = np.array([0.1, 0.4, 0.35, 0.8])
         auc_score = auc.compute(item_indices, pd_scores, gt_pos, gt_neg)
-        auc_score = auc.compute(item_indices, pd_scores, gt_pos, gt_neg)
         self.assertEqual(0.5, auc_score)
 
     def test_map(self):
@@ -342,31 +277,21 @@ def test_map(self):
         self.assertEqual(mAP.type, "ranking")
         self.assertEqual(mAP.name, "MAP")
 
-        item_indices = np.arange(3)
-        gt_pos = np.array([0])  # [1, 0, 0]
         item_indices = np.arange(3)
         gt_pos = np.array([0])  # [1, 0, 0]
         pd_scores = np.array([0.75, 0.5, 1])
         self.assertEqual(0.5, mAP.compute(item_indices, pd_scores, gt_pos))
-        self.assertEqual(0.5, mAP.compute(item_indices, pd_scores, gt_pos))
 
-        item_indices = np.arange(3)
-        gt_pos = np.array([2])  # [0, 0, 1]
         item_indices = np.arange(3)
         gt_pos = np.array([2])  # [0, 0, 1]
         pd_scores = np.array([1, 0.2, 0.1])
         self.assertEqual(1 / 3, mAP.compute(item_indices, pd_scores, gt_pos))
-        self.assertEqual(1 / 3, mAP.compute(item_indices, pd_scores, gt_pos))
 
         item_indices = np.arange(10)
         gt_pos = np.array([1, 3, 5])  # [0, 1, 0, 1, 0, 1, 0, 0, 0, 0]
         pd_scores = np.linspace(0.0, 1.0, len(item_indices))[::-1]
         self.assertEqual(0.5, mAP.compute(item_indices, pd_scores, gt_pos))
-        item_indices = np.arange(10)
-        gt_pos = np.array([1, 3, 5])  # [0, 1, 0, 1, 0, 1, 0, 0, 0, 0]
-        pd_scores = np.linspace(0.0, 1.0, len(item_indices))[::-1]
-        self.assertEqual(0.5, mAP.compute(item_indices, pd_scores, gt_pos))
 
 
 if __name__ == "__main__":
-    unittest.main()
\ No newline at end of file
+    unittest.main()
diff --git a/tests/cornac/utils/test_correlation.py b/tests/cornac/utils/test_correlation.py
deleted file mode 100644
index 7fe92b1..0000000
--- a/tests/cornac/utils/test_correlation.py
+++ /dev/null
@@ -1,341 +0,0 @@
-import unittest
-import os
-import pandas as pd
-import numpy as np
-from sklearn.preprocessing import StandardScaler, MinMaxScaler
-from cornac.utils.correlation import merge_user_diversity_files
-from cornac.utils.correlation import calculate_correlation
-from cornac.utils.correlation import scale_data
-from cornac.utils.correlation import apply_pca
-from cornac.utils.correlation import apply_agglomerative_clustering
-from cornac.utils.correlation import profile_clusters
-from cornac.utils.correlation import apply_tsne
-from cornac.utils.correlation import find_elbow_point
-from cornac.utils.correlation import apply_kmeans_clustering
-from cornac.utils.correlation import apply_gmm
-from cornac.utils.correlation import apply_dbscan
-from cornac.utils.correlation import count_data_points_in_clusters
-
-
-class TestMergeUserDiversityFiles(unittest.TestCase):
-    def test_merge_user_diversity_files(self):
-        test_directory = 'test_data'
-        os.makedirs(test_directory, exist_ok=True)
-        file1_path = os.path.join(test_directory, 'file1.csv')
-        file2_path = os.path.join(test_directory, 'file2.csv')
-        file3_path = os.path.join(test_directory, 'file3.csv')
-
-        data1 = {'User_ID': [1, 2, 3], 'Feature1': [10, 20, 30]}
-        data2 = {'User_ID': [1, 2, 3], 'Feature2': [40, 50, 60]}
-        data3 = {'User_ID': [1, 2, 3], 'Feature3': [70, 80, 90]}
-
-        pd.DataFrame(data1).to_csv(file1_path, index=False)
-        pd.DataFrame(data2).to_csv(file2_path, index=False)
-        pd.DataFrame(data3).to_csv(file3_path, index=False)
-
-        merged_df = merge_user_diversity_files(test_directory)
-
-        for file in os.listdir(test_directory):
-            file_path = os.path.join(test_directory, file)
-            if os.path.isfile(file_path):
-                os.remove(file_path)
-        os.rmdir(test_directory)
-
-        expected_columns = ['User_ID', 'Feature1', 'Feature2', 'Feature3']
-        self.assertListEqual(list(merged_df.columns), expected_columns)
-
-        expected_num_rows = 3
-        self.assertEqual(len(merged_df), expected_num_rows)
-
-        expected_data = {
-            'User_ID': [1, 2, 3],
-            'Feature1': [10, 20, 30],
-            'Feature2': [40, 50, 60],
-            'Feature3': [70, 80, 90]
-        }
-        expected_df = pd.DataFrame(expected_data)
-        pd.testing.assert_frame_equal(merged_df, expected_df)
-
-    def test_calculate_correlation(self):
-        self.df = pd.DataFrame({
-            'A': [1, 2, 3, 4],
-            'B': [4, 3, 2, 1],
-            'C': [1, 3, 2, 4]
-        })
-
-        correlation = calculate_correlation(self.df, 'A', 'B')
-        self.assertAlmostEqual(correlation, -1.0)
-
-        correlation = calculate_correlation(self.df, 'A', 'C')
-        self.assertAlmostEqual(correlation, 0.7999999999999999)
-
-        empty_df = pd.DataFrame()
-        with self.assertRaises(ValueError):
-            calculate_correlation(empty_df, 'A', 'B')
-
-        with self.assertRaises(ValueError):
-            calculate_correlation(self.df, 'A', 'D')
-        with self.assertRaises(ValueError):
-            calculate_correlation(self.df, 'E', 'B')
-
-    def test_scale_data(self):
-        self.data = pd.DataFrame({
-            'A': [1, 2, 3, 4, 5],
-            'B': [5, 4, 3, 2, 1],
-            'C': [2, 3, 4, 5, 6]
-        })
-
-        with self.assertRaises(ValueError):
-            scale_data(pd.DataFrame())
-        # Invalid input, not a DataFrame
-        with self.assertRaises(ValueError):
-            scale_data([])
-
-        result = scale_data(self.data)
-        expected = StandardScaler().fit_transform(self.data)
-        np.testing.assert_array_almost_equal(result.values, expected)
-
-        result = scale_data(self.data, columns=['A', 'B'])
-        expected = StandardScaler().fit_transform(self.data[['A', 'B']])
-        np.testing.assert_array_almost_equal(result.values, expected)
-        self.assertListEqual(result.columns.tolist(), ['A', 'B'])
-
-        scaler = MinMaxScaler()
-        result = scale_data(self.data, scaler=scaler)
-        expected = scaler.fit_transform(self.data)
-        np.testing.assert_array_almost_equal(result.values, expected)
-
-        scaler = MinMaxScaler()
-        result = scale_data(self.data, columns=['A', 'B'], scaler=scaler)
-        expected = scaler.fit_transform(self.data[['A', 'B']])
-        np.testing.assert_array_almost_equal(result.values, expected)
-        self.assertListEqual(result.columns.tolist(), ['A', 'B'])
-
-    def test_apply_pca(self):
-        self.data = pd.DataFrame({
-            'feature1': np.random.rand(100),
-            'feature2': np.random.rand(100),
-            'feature3': np.random.rand(100),
-            'feature4': np.random.rand(100)
-        })
-        self.scaler = StandardScaler()
-        self.scaled_data = pd.DataFrame(self.scaler.fit_transform(self.data), columns=self.data.columns)
-
-        pca_df, loadings_df = apply_pca(self.scaled_data, n_components=3)
-        self.assertEqual(pca_df.shape[1], 3)
-        self.assertEqual(len(pca_df), len(self.scaled_data))
-        self.assertEqual(loadings_df.shape, (3, self.scaled_data.shape[1]))
-        self.assertListEqual(pca_df.columns.tolist(), ['PC1', 'PC2', 'PC3'])
-
-        custom_columns = ['Comp1', 'Comp2']
-        pca_df, _ = apply_pca(self.scaled_data, n_components=2, column_names=custom_columns)
-        self.assertListEqual(pca_df.columns.tolist(), custom_columns)
-
-        with self.assertRaises(ValueError):
-            apply_pca(self.scaled_data, n_components=-1)
-
-        with self.assertRaises(ValueError):
-            apply_pca(self.scaled_data, n_components=10)
-
-        with self.assertRaises(ValueError):
-            apply_pca(self.scaled_data, n_components=3, column_names=['PC1'])
-
-        empty_df = pd.DataFrame()
-        with self.assertRaises(ValueError):
-            apply_pca(empty_df, n_components=2)
-
-    def test_apply_agglomerative_clustering(self):
-        np.random.seed(0)
-        self.data = np.random.rand(100, 2)
-        self.n_clusters = 3
-
-        with self.assertRaises(ValueError):
-            apply_agglomerative_clustering(self.data, -1)
-
-        with self.assertRaises(ValueError):
-            apply_agglomerative_clustering(self.data, self.n_clusters, linkage='ward', metric='manhattan')
-
-        clusters = apply_agglomerative_clustering(self.data, self.n_clusters)
-        self.assertEqual(len(clusters), len(self.data))
-
-        with self.assertRaises(ValueError):
-            apply_agglomerative_clustering(None, self.n_clusters)
-
-        clusters = apply_agglomerative_clustering(self.data, self.n_clusters, linkage='average')
-        self.assertEqual(len(clusters), len(self.data))
-
-    def test_profile_clusters(self):
-        self.data = np.random.rand(100, 3)  # Random data with 3 features
-        self.clusters = np.random.randint(0, 3, size=100)  # Random cluster labels
-
-        result = profile_clusters(self.data, self.clusters)
-        self.assertIsInstance(result, dict)
-        self.assertEqual(len(result), len(np.unique(self.clusters)))
-
-        for key, value in result.items():
-            self.assertTrue(key.startswith('Cluster '))
-            self.assertIsInstance(value, pd.DataFrame)
-            self.assertEqual(value.shape[1], self.data.shape[1])  # Number of columns should match data's features
-
-        with self.assertRaises(ValueError):
-            profile_clusters(self.data, self.clusters[:-1])
-
-    def test_apply_tsne(self):
-        self.data_array = np.random.rand(100, 4)
-        self.data_df = pd.DataFrame(self.data_array, columns=['A', 'B', 'C', 'D'])
-        self.data_list = self.data_array.tolist()
-
-        tsne_df = apply_tsne(self.data_array, n_components=2)
-        self.assertEqual(tsne_df.shape[1], 2)
-        self.assertIsInstance(tsne_df, pd.DataFrame)
-
-        tsne_df = apply_tsne(self.data_df, n_components=2)
-        self.assertEqual(tsne_df.shape[1], 2)
-        self.assertIsInstance(tsne_df, pd.DataFrame)
-
-        tsne_df = apply_tsne(self.data_list, n_components=2)
-        self.assertEqual(tsne_df.shape[1], 2)
-        self.assertIsInstance(tsne_df, pd.DataFrame)
-
-        with self.assertRaises(ValueError):
-            apply_tsne("invalid_input", n_components=2)
-
-        with self.assertRaises(ValueError):
-            apply_tsne([], n_components=2)
-
-        with self.assertRaises(ValueError):
-            apply_tsne(self.data_array, n_components=0)
-
-        with self.assertRaises(ValueError):
-            apply_tsne(self.data_array, perplexity=-10)
-
-        with self.assertRaises(ValueError):
-            apply_tsne(self.data_array, learning_rate=0)
-
-        with self.assertRaises(ValueError):
-            apply_tsne(self.data_array, n_iter=-500)
-
-    def test_find_elbow_point(self):
-        distances = [1, 2, 3, 4, 8, 10, 12]
-        elbow_index, elbow_distance = find_elbow_point(distances)
-        self.assertEqual(elbow_index, 3)
-        self.assertEqual(elbow_distance, 4)
-
-        distances = [1, 2, 5, 6, 7, 9, 10]
-        elbow_index, elbow_distance = find_elbow_point(distances)
-        self.assertEqual(elbow_index, 2)
-        self.assertEqual(elbow_distance, 5)
-
-        distances = np.sort([3, 1, 4, 1, 5, 9, 2, 6])
-        elbow_index, elbow_distance = find_elbow_point(distances)
-        self.assertEqual(elbow_index, 6)
-        self.assertEqual(elbow_distance, 6)
-
-        with self.assertRaises(ValueError):
-            find_elbow_point("not an array")
-
-        with self.assertRaises(ValueError):
-            find_elbow_point([1])
-
-    def test_apply_kmeans_clustering(self):
-        data = pd.DataFrame([[1, 2, 3], [4, 5, 6]])
-        with self.assertRaises(ValueError):
-            apply_kmeans_clustering(data, column_names='invalid')
-
-        data = pd.DataFrame({'A': [1, 2, 3, 4]})
-        with self.assertRaises(ValueError):
-            apply_kmeans_clustering(data, column_names='A')
-
-        data = pd.DataFrame({'A': [1, 2, 3, 4], 'B': [5, 6, 7, 8]})
-        expected_clusters = np.array([1, 1, 0, 0])
-        clusters = apply_kmeans_clustering(data,  n_clusters=2, column_names=['A', 'B'])
-        np.testing.assert_array_equal(clusters, expected_clusters)
-
-        data = pd.DataFrame({'A': [1, 2, 3, 4], 'B': [5, 6, 7, 8]})
-        expected_clusters = np.array([1, 1, 0, 0])
-        clusters = apply_kmeans_clustering(data, n_clusters=2)
-        np.testing.assert_array_equal(clusters, expected_clusters)
-
-    def test_apply_gmm(self):
-
-        data = pd.DataFrame({
-            'feature1': [1.0, 2.0, 3.0, 4.0],
-            'feature2': [1.0, 2.0, 3.0, 4.0]
-        })
-        clusters = apply_gmm(data, n_components=2, random_state=0)
-        self.assertEqual(len(clusters), len(data))
-
-        data = np.array([
-            [1.0, 2.0],
-            [3.0, 4.0],
-            [5.0, 6.0],
-            [7.0, 8.0]
-        ])
-        clusters = apply_gmm(data, n_components=2, random_state=0)
-        self.assertEqual(len(clusters), len(data))
-
-        data = [
-            [1.0, 2.0],
-            [3.0, 4.0],
-            [5.0, 6.0],
-            [7.0, 8.0]
-        ]
-        clusters = apply_gmm(data, n_components=2, random_state=0)
-        self.assertEqual(len(clusters), len(data))
-
-        data = pd.DataFrame()
-        with self.assertRaises(ValueError):
-            apply_gmm(data)
-
-        data = np.array([])
-        with self.assertRaises(ValueError):
-            apply_gmm(data)
-
-        data = "invalid data type"
-        with self.assertRaises(ValueError):
-            apply_gmm(data)
-
-    def test_apply_dbscan(self):
-        data = pd.DataFrame({
-            'feature1': [1.0, 2.0, 2.1, 8.0, 8.1],
-            'feature2': [1.0, 2.0, 2.1, 8.0, 8.1]
-        })
-        clusters = apply_dbscan(data, eps=1.0, min_samples=2)
-        self.assertEqual(len(clusters), len(data))
-
-        data = pd.DataFrame()
-        with self.assertRaises(ValueError):
-            apply_dbscan(data)
-
-        data = np.array([])
-        with self.assertRaises(ValueError):
-            apply_dbscan(data)
-
-        data = "invalid data type"
-        with self.assertRaises(ValueError):
-            apply_dbscan(data)
-
-    def test_count_data_points_in_clusters(self):
-        clusters = [0, 0, 0, 0]
-        expected_output = {0: 4}
-        self.assertEqual(count_data_points_in_clusters(clusters), expected_output)
-
-        clusters = [0, 1, 0, 1, 1, 2]
-        expected_output = {0: 2, 1: 3, 2: 1}
-        self.assertEqual(count_data_points_in_clusters(clusters), expected_output)
-
-        clusters = "invalid_input"
-        with self.assertRaises(ValueError):
-            count_data_points_in_clusters(clusters)
-
-        clusters = [1] * 10000 + [2] * 5000 + [3] * 2500
-        expected_output = {1: 10000, 2: 5000, 3: 2500}
-        self.assertEqual(count_data_points_in_clusters(clusters), expected_output)
-
-        clusters = []
-        expected_output = {}
-        self.assertEqual(count_data_points_in_clusters(clusters), expected_output)
-
-
-if __name__ == '__main__':
-    unittest.main()