feat: normalize post front matter and add keyword capitalization script

DiogoRibeiro7 · DiogoRibeiro7 · commit 275dac73fd48 · 2024-10-19T17:56:48.000+01:00
diff --git a/_posts/2020-01-07-how_big_data_transforming_predictive_maintenance.md b/_posts/2020-01-07-how_big_data_transforming_predictive_maintenance.md
@@ -56,7 +56,7 @@ title: How Big Data is Transforming Predictive Maintenance
 ---
 author_profile: false
 categories:
-- Big Data
+- Data Science
 classes: wide
 date: '2020-01-07'
 excerpt: Big Data is revolutionizing predictive maintenance by offering unprecedented
diff --git a/_posts/2021-06-01-customer_segmentation.md b/_posts/2021-06-01-customer_segmentation.md
@@ -15,7 +15,7 @@ header:
   teaser: /assets/images/data_science_9.jpg
   twitter_image: /assets/images/data_science_1.jpg
 keywords:
-- Customer Analytics
+- Customer analytics
 - Customer segmentation
 - Unsupervised learning
 - Data science
diff --git a/_posts/2024-07-31-Custom_libraries.md b/_posts/2024-07-31-Custom_libraries.md
@@ -1,33 +1,36 @@
 ---
-title: 'Building Custom Python Libraries for Your Industry Needs'
+author_profile: false
 categories:
 - Python
-tags:
-- Python libraries
-- Custom software
-- Industry solutions
-- Software development
-- Automation
-- Python
-author_profile: false
+classes: wide
 date: '2024-07-31'
+excerpt: A guide on developing custom Python libraries to meet specific industry needs, focusing on software development and automation.
 header:
   image: /assets/images/data_science_4.jpg
   og_image: /assets/images/data_science_5.jpg
   overlay_image: /assets/images/data_science_4.jpg
   show_overlay_excerpt: false
   teaser: /assets/images/data_science_4.jpg
   twitter_image: /assets/images/data_science_5.jpg
-seo_title: 'Building Custom Python Libraries for Industry-Specific Solutions'
-seo_description: 'Learn how to create custom Python libraries tailored to your industry needs. This article covers strategies for software development and automation using Python.'
-excerpt: 'A guide on developing custom Python libraries to meet specific industry needs, focusing on software development and automation.'
-summary: 'This article explores the process of building custom Python libraries, offering insights into Python’s versatility for developing industry-specific software solutions and automation tools.'
-keywords: 
+keywords:
 - Python libraries
 - Custom software development
 - Automation
 - Industry solutions
-classes: wide
+- python
+seo_description: Learn how to create custom Python libraries tailored to your industry needs. This article covers strategies for software development and automation using Python.
+seo_title: Building Custom Python Libraries for Industry-Specific Solutions
+seo_type: article
+summary: This article explores the process of building custom Python libraries, offering insights into Python’s versatility for developing industry-specific software solutions and automation tools.
+tags:
+- Python libraries
+- Custom software
+- Industry solutions
+- Software development
+- Automation
+- Python
+- python
+title: Building Custom Python Libraries for Your Industry Needs
 ---
 
 ## Overview
diff --git a/_posts/2024-09-12-importance_sampling.md b/_posts/2024-09-12-importance_sampling.md
@@ -55,8 +55,7 @@ Estimating credit risk in portfolios containing loans or bonds is crucial for fi
 ---
 author_profile: false
 categories:
-- Finance
-- Risk Management
+- Statistics
 classes: wide
 date: '2024-09-12'
 excerpt: Importance Sampling offers an efficient alternative to traditional Monte
@@ -122,8 +121,7 @@ In this model, each obligor’s default is influenced by a set of **systematic f
 ---
 author_profile: false
 categories:
-- Finance
-- Risk Management
+- Statistics
 classes: wide
 date: '2024-09-12'
 excerpt: Importance Sampling offers an efficient alternative to traditional Monte
@@ -201,8 +199,7 @@ When obligors are dependent (i.e., influenced by common risk factors), IS become
 ---
 author_profile: false
 categories:
-- Finance
-- Risk Management
+- Statistics
 classes: wide
 date: '2024-09-12'
 excerpt: Importance Sampling offers an efficient alternative to traditional Monte
diff --git a/_posts/2024-09-17-ml_healthcare.md b/_posts/2024-09-17-ml_healthcare.md
@@ -22,7 +22,6 @@ keywords:
 - Personalized medicine
 - Predictive analytics
 - Healthcare
-- Machine Learning
 - Healthcare data privacy
 - Clinical implementation challenges
 - Predictive patient outcomes
diff --git a/capitalized_keywords.py b/capitalized_keywords.py
@@ -0,0 +1,120 @@
+"""Capitalize the ``keywords`` front matter list of markdown posts.
+
+Run as a script to rewrite the ``.md`` files in ``folder_path`` in place.
+"""
+
+import os
+import re
+
+import yaml
+
+# Define the folder where the markdown files are stored
+folder_path = './_posts'  # Change this to your folder path
+
+# List of stop words to exclude from capitalization
+stop_words = {'at', 'vs', 'and', 'or', 'the', 'of', 'in', 'on', 'for', 'to', 'a'}
+
+# Leading front matter only: an opening '---' line at the very start of the
+# file, the YAML body (group 1), and a closing '---' on a line of its own.
+FRONT_MATTER_RE = re.compile(
+    r'\A---[ \t]*\r?\n(.*?)^---[ \t]*$', re.DOTALL | re.MULTILINE
+)
+
+
+def capitalize_keywords(keywords):
+    """Return a new list with each keyword phrase capitalized word by word.
+
+    The first word of a phrase is always capitalized; later words are
+    capitalized unless they are in ``stop_words``, which are lower-cased.
+    Only the first letter of a word is changed, so acronyms such as ``AI``
+    keep their casing. Non-string entries are returned unchanged.
+    """
+
+    def capitalize_word(word, first_word=False):
+        # Stop words are matched case-insensitively so 'Of' and 'of' agree.
+        if not first_word and word.lower() in stop_words:
+            return word.lower()
+        # str.capitalize() would lower-case the rest of the word (AI -> Ai).
+        return word[:1].upper() + word[1:]
+
+    def process_phrase(phrase):
+        if not isinstance(phrase, str):
+            # YAML can load bare entries such as 2024 or yes as non-strings.
+            return phrase
+        return ' '.join(
+            capitalize_word(word, index == 0)
+            for index, word in enumerate(phrase.split())
+        )
+
+    return [process_phrase(phrase) for phrase in keywords]
+
+
+def process_markdown_file(file_path):
+    """Capitalize the ``keywords`` list in one markdown file's front matter.
+
+    The file is rewritten in place only when at least one keyword changes.
+    Files without front matter, with invalid YAML, or without a ``keywords``
+    list are reported on stdout and left untouched.
+    """
+    with open(file_path, 'r', encoding='utf-8') as file:
+        content = file.read()
+
+    front_matter_match = FRONT_MATTER_RE.match(content)
+    if not front_matter_match:
+        print(f"No front matter found in {file_path}")
+        return
+
+    # Parse the front matter using YAML
+    try:
+        front_matter_dict = yaml.safe_load(front_matter_match.group(1))
+    except yaml.YAMLError as exc:
+        print(f"Error parsing YAML in {file_path}: {exc}")
+        return
+
+    # Empty front matter loads as None, and so does a bare `keywords:` key;
+    # neither can be iterated, so treat both as "nothing to do".
+    keywords = (
+        front_matter_dict.get('keywords')
+        if isinstance(front_matter_dict, dict)
+        else None
+    )
+    if not isinstance(keywords, list):
+        print(f"No 'keywords' found in {file_path}")
+        return
+
+    updated_keywords = capitalize_keywords(keywords)
+    if updated_keywords == keywords:
+        print(f"Keywords already capitalized in {file_path}")
+        return
+    front_matter_dict['keywords'] = updated_keywords
+
+    # allow_unicode keeps characters such as curly quotes readable instead of
+    # escaping them as \uXXXX sequences.
+    updated_front_matter = yaml.dump(
+        front_matter_dict, default_flow_style=False, allow_unicode=True
+    )
+
+    # Splice by position: re.sub would replace every '---' pair in the file
+    # (horizontal rules, tables) and interpret backslashes in the new YAML.
+    start, end = front_matter_match.span(1)
+    updated_content = content[:start] + updated_front_matter + content[end:]
+
+    # Save the updated content back to the file
+    with open(file_path, 'w', encoding='utf-8') as file:
+        file.write(updated_content)
+
+    print(f"Updated keywords in {file_path}")
+
+
+def process_all_markdown_files(folder_path):
+    """Process every ``.md`` file directly inside ``folder_path``."""
+    # Sorted so the log output is in a stable order between runs.
+    for filename in sorted(os.listdir(folder_path)):
+        if filename.endswith(".md"):  # Check if it's a markdown file
+            file_path = os.path.join(folder_path, filename)
+            process_markdown_file(file_path)
+
+
+# Run the function for the specified folder
+if __name__ == "__main__":
+    process_all_markdown_files(folder_path)