diff --git a/Beta-L/Influencer_dashboard_design/amazonbar.png b/Beta-L/Influencer_dashboard_design/amazonbar.png
new file mode 100644
index 0000000..1f7c1d9
Binary files /dev/null and b/Beta-L/Influencer_dashboard_design/amazonbar.png differ
diff --git a/Beta-L/Influencer_dashboard_design/app.py b/Beta-L/Influencer_dashboard_design/app.py
new file mode 100644
index 0000000..dfb4c33
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/app.py
@@ -0,0 +1,257 @@
+from flask import Flask, render_template, request, redirect, url_for
+import plotly.express as px
+import pandas as pd
+import mysql.connector
+
+app = Flask(__name__)
+
+
+# MySQL database connection parameters
+db_params = {
+    "host": "sebi-hackathon.mysql.database.azure.com",
+    "user": "mysql",
+    "password": "Betateam-L",
+    "database": "fintech-influencers-claims"
+}
+
+# Create a MySQL database connection
+db_connection = mysql.connector.connect(**db_params)
+db_cursor = db_connection.cursor()
+
+# Fetch data from the table
+query = "SELECT * FROM fintech_influencers"
+db_cursor.execute(query)
+result = db_cursor.fetchall()
+
+# Define column names
+columns = [desc[0] for desc in db_cursor.description]
+
+# Create a DataFrame from the fetched data
+df = pd.DataFrame(result, columns=columns)
+
+# Previously the dataset was loaded from a local file:
+# df = pd.read_excel('indummm.xlsx')
+
+df['Flagged Claims'] = ''
+
+# Dictionaries to store previous feedback and ratings
+previous_feedback = {}
+previous_ratings = {}
+
+@app.route('/')
+def index():
+    filtered_data = df  # Initialize with all data
+
+    keywords = request.args.get('keywords', '').split(',')
+    filter_option = request.args.get('filter', 'both')  # Default to 'both' (search all fields)
+
+    # Apply filters based on the selected filter option
+    if filter_option == 'claims':
+        filtered_data = df[df['Claim'].str.contains('|'.join(keywords))]
+    elif filter_option == 'influencers':
+        filtered_data = df[df['Name'].str.contains('|'.join(keywords))]
+    elif filter_option == 'keywords':
+        filtered_data = df[df['Keywords'].str.contains('|'.join(keywords))]
+    elif filter_option == 'both':
+        filtered_data = df[
+            (df['Claim'].str.contains('|'.join(keywords))) |
+            (df['Name'].str.contains('|'.join(keywords))) |
+            (df['Keywords'].str.contains('|'.join(keywords)))
+        ]
+
+    sorted_data = sorted(filtered_data.to_dict('records'), key=lambda x: x['Credibility_Score'], reverse=True)
+    cards_per_row = 3
+    rows = [sorted_data[i:i+cards_per_row] for i in range(0, len(sorted_data), cards_per_row)]
+    return render_template('index.html', rows=rows)
+
+
+@app.route('/profile/<influencer_name>')
+def profile(influencer_name):
+    filtered_data = df[df['Name'] == influencer_name]
+
+    if not filtered_data.empty:
+        influencer = filtered_data.iloc[0]
+        influencer_name = influencer['Name']
+        influencer_previous_feedback = previous_feedback.get(influencer_name, [])
+        influencer_previous_ratings = previous_ratings.get(influencer_name, [])
+
+        return render_template(
+            'profile.html',
+            influencer=influencer,
+            previous_feedback=influencer_previous_feedback,
+            previous_ratings=influencer_previous_ratings
+        )
+    else:
+        return "Influencer not found."
+
+
+@app.route('/visualize')
+def visualize():
+    return render_template('visualize.html')
+
+@app.route('/visualize/credibility_bar')
+def visualize_credential_bar():
+    fig = px.bar(df, x='Name', y='Credibility_Score', title='Credibility Score Distribution')
+    return fig.to_html()
+
+@app.route('/visualize/claim_pie')
+def visualize_claim_pie():
+    claim_counts = df['Claim'].value_counts()
+    fig = px.pie(claim_counts, names=claim_counts.index, values=claim_counts.values, title='Pie Chart for Claim Categories')
+    return fig.to_html()
+
+@app.route('/flag/<int:index>')
+def flag(index):
+    df.at[index, 'Flagged'] = True  # Assuming you have a 'Flagged' column in your DataFrame
+    return redirect(url_for('index'))
+
+@app.route('/feedback/<influencer_name>', methods=['GET', 'POST'])
+def feedback(influencer_name):
+    influencer = df[df['Name'] == influencer_name].iloc[0]
+
+    if request.method == 'POST':
+        feedback = request.form.get('feedback')
+
+        # Store previous feedback in the dictionary
+        if influencer_name in previous_feedback:
+            previous_feedback[influencer_name].append(feedback)
+        else:
+            previous_feedback[influencer_name] = [feedback]
+
+        # Update the DataFrame with the latest feedback
+        influencer_index = df[df['Name'] == influencer_name].index[0]  # Row index of the influencer
+        df.at[influencer_index, 'Feedback'] = feedback
+
+        return redirect(url_for('profile', influencer_name=influencer_name))
+
+    influencer_previous_feedback = previous_feedback.get(influencer_name, [])
+
+    return render_template('feedback_form.html', influencer=influencer, previous_feedback=influencer_previous_feedback)
+
+
+@app.route('/flag_claim/<influencer_name>/<claim>', methods=['POST'])
+def flag_claim(influencer_name, claim):
+    influencer_index = df[df['Name'] == influencer_name].index[0]
+
+    # Read the flagged-claims list for this influencer, write it back via .at
+    # so the change persists in the DataFrame (a copied Series would not).
+    flagged_claims = df.at[influencer_index, 'Flagged Claims']
+    if not isinstance(flagged_claims, list):
+        flagged_claims = []
+
+    if claim not in flagged_claims:
+        flagged_claims.append(claim)
+    df.at[influencer_index, 'Flagged Claims'] = flagged_claims
+
+    # Other flagging actions (e.g. updating a database or a log) could go here
+
+    return redirect(url_for('profile', influencer_name=influencer_name))
+
+
+@app.route('/rate/<influencer_name>', methods=['GET', 'POST'])
+def rate(influencer_name):
+    influencer = df[df['Name'] == influencer_name].iloc[0]
+
+    if request.method == 'POST':
+        rating = int(request.form.get('rating'))
+
+        # Store previous ratings in the dictionary
+        if influencer_name in previous_ratings:
+            previous_ratings[influencer_name].append(rating)
+        else:
+            previous_ratings[influencer_name] = [rating]
+
+        # Update the DataFrame with the latest rating
+        influencer_index = df[df['Name'] == influencer_name].index[0]  # Row index of the influencer
+        df.at[influencer_index, 'Rating'] = rating
+        return redirect(url_for('profile', influencer_name=influencer_name))
+
+    influencer_previous_ratings = previous_ratings.get(influencer_name, [])
+
+    return render_template('rating_form.html', influencer=influencer, previous_ratings=influencer_previous_ratings)
+
+
+@app.route('/compare', methods=['GET', 'POST'])
+def compare():
+    influencers_list = df['Name'].tolist()
+
+    if request.method == 'POST':
+        selected_influencers = request.form.getlist('influencers')
+
+        if len(selected_influencers) <= 3:
+            selected_data = df[df['Name'].isin(selected_influencers)]
+
+            # Create the Credibility Score graph
+            credibility_graph = px.bar(selected_data, x='Name', y='Credibility_Score', title='Comparison of Credibility Scores')
+
+            # Create the Rating graph
+            rating_graph = px.bar(selected_data, x='Name', y='Rating', title='Comparison of Ratings')
+
+            # Convert graphs to HTML
+            credibility_graph = credibility_graph.to_html(full_html=False, include_plotlyjs='cdn')
+            rating_graph = rating_graph.to_html(full_html=False, include_plotlyjs='cdn')
+
+            return render_template(
+                'compare.html',
+                influencers=influencers_list,
+                credibility_graph=credibility_graph,
+                rating_graph=rating_graph
+            )
+
+        else:
+            return "Please select up to 3 influencers for comparison."
+
+    return render_template('compare.html', influencers=influencers_list, credibility_graph='', rating_graph='')
+
+
+@app.route('/visualize/keyword_bar')
+def visualize_keyword_bar():
+    keyword_freq = df['Keywords'].str.split(', ').explode().value_counts()
+    fig = px.bar(x=keyword_freq.index, y=keyword_freq.values, title='Keyword Frequency Bar Chart')
+    return fig.to_html()
+
+@app.route('/visualize/scatter_credential_keywords')
+def visualize_scatter_credential_keywords():
+    fig = px.scatter(df, x='Credibility_Score', y='Keywords', title='Scatter Plot: Credibility vs. Keywords')
+    return fig.to_html()
+
+if __name__ == '__main__':
+    app.run(debug=True)
diff --git a/Beta-L/Influencer_dashboard_design/compare.html b/Beta-L/Influencer_dashboard_design/compare.html
new file mode 100644
index 0000000..9de2a2b
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/compare.html
@@ -0,0 +1,37 @@
+<!DOCTYPE html>
+<html>
+<head>
+    <title>Compare Influencers</title>
+    <link rel="stylesheet" href="styles.css">
+</head>
+<body>
+    <div class="header">
+        <h1>Compare Influencers</h1>
+    </div>
+    <form method="POST" action="/compare">
+        <h2>Select up to 3 influencers for comparison:</h2>
+        {% for influencer in influencers %}
+        <label>
+            <input type="checkbox" name="influencers" value="{{ influencer }}"> {{ influencer }}
+        </label>
+        {% endfor %}
+        <br>
+        <button type="submit" class="compare-button">Compare</button>
+    </form>
+    {% if credibility_graph %}
+    <div class="row">
+        <div>
+            <h2>Comparison of Credibility Scores</h2>
+            {{ credibility_graph|safe }}
+        </div>
+        <div>
+            <h2>Comparison of Ratings</h2>
+            {{ rating_graph|safe }}
+        </div>
+    </div>
+    {% endif %}
+</body>
+</html>
diff --git a/Beta-L/Influencer_dashboard_design/feedback_form.html b/Beta-L/Influencer_dashboard_design/feedback_form.html
new file mode 100644
index 0000000..9e95256
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/feedback_form.html
@@ -0,0 +1,24 @@
+<!DOCTYPE html>
+<html>
+<head>
+    <title>Feedback</title>
+</head>
+<body>
+    <h1>Feedback for Influencer: {{ influencer.Name }}</h1>
+    <form method="POST">
+        <textarea name="feedback" rows="4" cols="50" required></textarea>
+        <br>
+        <button type="submit">Submit Feedback</button>
+    </form>
+    <h2>Previous Feedback:</h2>
+    <ul>
+        {% for feedback_entry in previous_feedback %}
+        <li>{{ feedback_entry }}</li>
+        {% endfor %}
+    </ul>
+</body>
+</html>
diff --git a/Beta-L/Influencer_dashboard_design/index.html b/Beta-L/Influencer_dashboard_design/index.html
new file mode 100644
index 0000000..2b1dbeb
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/index.html
@@ -0,0 +1,99 @@
+<!DOCTYPE html>
+<html>
+<head>
+    <title>Influencer Dashboard</title>
+    <link rel="stylesheet" href="styles.css">
+</head>
+<body>
+    <div class="container">
+        <div class="header">
+            <h1>Influencer Dashboard</h1>
+        </div>
+        <div class="dashboard-content">
+            <h2>Get insights from Visualizations:</h2>
+            <a href="/visualize">View Visualizations</a>
+            <a href="/compare">Compare Influencers</a>
+        </div>
+        <form method="GET" action="/" class="search-bar">
+            <input type="text" name="keywords" class="search-input" placeholder="Comma-separated keywords">
+            <select name="filter">
+                <option value="both">All fields</option>
+                <option value="claims">Claims</option>
+                <option value="influencers">Influencers</option>
+                <option value="keywords">Keywords</option>
+            </select>
+            <button type="submit" class="search-btn">Search</button>
+        </form>
+        <div class="main">
+            {% for row in rows %}
+            <div class="row">
+                {% for influencer in row %}
+                <div class="card">
+                    <div class="title">
+                        <h1><a href="/profile/{{ influencer.Name }}">{{ influencer.Name }}</a></h1>
+                    </div>
+                    <div class="scores">Credibility Score: {{ influencer.Credibility_Score }}</div>
+                    <div class="des">{{ influencer.Claim }}</div>
+                </div>
+                {% endfor %}
+            </div>
+            {% endfor %}
+        </div>
+    </div>
+</body>
+</html>
diff --git a/Beta-L/Influencer_dashboard_design/profile.html b/Beta-L/Influencer_dashboard_design/profile.html
new file mode 100644
index 0000000..11e6580
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/profile.html
@@ -0,0 +1,204 @@
+<!DOCTYPE html>
+<html>
+<head>
+    <title>Influencer Profile</title>
+    <link rel="stylesheet" href="styles.css">
+</head>
+<body>
+    <div class="container">
+        <div class="header">
+            <h1>Name: {{ influencer.Name }}</h1>
+        </div>
+        <div class="scores">
+            <h2>Credibility Score: {{ influencer['Credibility_Score'] }}</h2>
+        </div>
+        <div class="des">
+            <h3>Explanation: {{ influencer.Explanation }}</h3>
+        </div>
+        <div class="des">
+            <h3>Claim: {{ influencer.Claim }}</h3>
+        </div>
+        <div class="des">
+            <h3>Keywords: {{ influencer.Keywords }}</h3>
+        </div>
+        <div class="des">
+            <h3>Rating: {{ influencer.Rating }}</h3>
+        </div>
+        <div>
+            <p>Social Network Links:</p>
+            {% if influencer['Social_Network_Links'] %}
+            <ul>
+                {% for link in influencer['Social_Network_Links'].split(',') %}
+                <li><a href="{{ link }}">{{ link }}</a></li>
+                {% endfor %}
+            </ul>
+            {% else %}
+            <p>No social network links available.</p>
+            {% endif %}
+        </div>
+        <div>
+            <p>Recent Post Links:</p>
+            {% if influencer['Recent_Post_Links'] %}
+            <ul>
+                {% for link in influencer['Recent_Post_Links'].split(',') %}
+                <li><a href="{{ link }}">{{ link }}</a></li>
+                {% endfor %}
+            </ul>
+            {% else %}
+            <p>No recent post links available.</p>
+            {% endif %}
+        </div>
+        <div>
+            <p>Click here to flag a misleading claim:</p>
+            <ul>
+                {% for claim in influencer.Claim.split(', ') %}
+                <li>
+                    {{ claim }}
+                    <form method="POST" action="{{ url_for('flag_claim', influencer_name=influencer.Name, claim=claim) }}">
+                        <button type="submit">Flag claim</button>
+                    </form>
+                </li>
+                {% endfor %}
+            </ul>
+        </div>
+        <div>
+            <h2>Previous Feedback:</h2>
+            <ul>
+                {% for feedback_entry in previous_feedback %}
+                <li>{{ feedback_entry }}</li>
+                {% endfor %}
+            </ul>
+            <a href="{{ url_for('feedback', influencer_name=influencer.Name) }}">Give feedback</a>
+        </div>
+        <div>
+            <h2>Rate Influencer:</h2>
+            <form method="POST" action="{{ url_for('rate', influencer_name=influencer.Name) }}">
+                <input type="number" name="rating" min="1" max="5" required>
+                <button type="submit">Submit Rating</button>
+            </form>
+        </div>
+        <div>
+            <h2>Previous Ratings:</h2>
+            <ul>
+                {% for rating in previous_ratings %}
+                <li>{{ rating }}</li>
+                {% endfor %}
+            </ul>
+        </div>
+        <a href="/">Back to Dashboard</a>
+    </div>
+</body>
+</html>
diff --git a/Beta-L/Influencer_dashboard_design/rating_form.html b/Beta-L/Influencer_dashboard_design/rating_form.html
new file mode 100644
index 0000000..05d0d56
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/rating_form.html
@@ -0,0 +1,24 @@
+<!DOCTYPE html>
+<html>
+<head>
+    <title>Rating</title>
+</head>
+<body>
+    <h1>Rate Influencer: {{ influencer.Name }}</h1>
+    <form method="POST">
+        <input type="number" name="rating" min="1" max="5" required>
+        <br>
+        <button type="submit">Submit Rating</button>
+    </form>
+    <h2>Previous Ratings:</h2>
+    <ul>
+        {% for rating in previous_ratings %}
+        <li>{{ rating }}</li>
+        {% endfor %}
+    </ul>
+</body>
+</html>
diff --git a/Beta-L/Influencer_dashboard_design/styles.css b/Beta-L/Influencer_dashboard_design/styles.css
new file mode 100644
index 0000000..d9659e6
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/styles.css
@@ -0,0 +1,288 @@
+/* Reset some default styles */
+body, h1, h2, h3, h4, h5, h6, p, ul, ol, li {
+    margin: 0;
+    padding: 0;
+}
+
+body {
+    font-family: Arial, sans-serif;
+    background-color: #f5f5f5;
+    color: #333;
+}
+
+.container {
+    max-width: 1200px;
+    margin: 0 auto;
+    padding: 20px;
+}
+
+.header {
+    background-color: #4cff00;
+    color: #fff;
+    text-align: center;
+    padding: 20px;
+    margin-bottom: 20px;
+    border-radius: 10px;
+}
+
+.action-links {
+    padding-top: 10px;
+    background-color: #f9f9f9;
+    border-bottom: 1px solid #ddd;
+    margin-bottom: 20px;
+    border-radius: 10px;
+}
+
+.action-links a {
+    margin-right: 10px;
+    color: #3498db;
+    text-decoration: none;
+    transition: color 0.3s;
+}
+
+.action-links a:hover {
+    color: #217dbb;
+}
+
+.visualize-links ul {
+    list-style: none;
+    padding: 0;
+}
+
+.visualize-links li {
+    margin-bottom: 10px;
+}
+
+.visualize-links a {
+    color: #ff6a00;
+    text-decoration: none;
+    transition: color 0.3s;
+}
+
+.visualize-links a:hover {
+    color: #217dbb;
+}
+
+/* Apply Filters Form */
+form {
+    margin-bottom: 20px;
+}
+
+form label {
+    margin-right: 10px;
+}
+
+/* Apply Filters Button */
+button[type="submit"] {
+    background-color: #3498db;
+    color: #fff;
+    border: none;
+    padding: 10px 20px;
+    border-radius: 5px;
+    cursor: pointer;
+    transition: background-color 0.3s, color 0.3s;
+}
+
+button[type="submit"]:hover {
+    background-color: #217dbb;
+}
+
+/* Dashboard Styling */
+.dashboard-header {
+    background-color: #0094ff;
+    color: #f5f5f5;
+    text-align: center;
+    padding: 20px;
+    border-radius: 10px;
+    margin-bottom: 20px;
+}
+
+.dashboard-content {
+    text-align: center;
+    margin-top: 20px;
+    padding: 20px;
+    background-color: #f9f9f9;
+    border-radius: 10px;
+}
+
+.dashboard-content h2 {
+    margin-bottom: 10px;
+}
+
+/* Card UI styles */
+.main {
+    margin: 20px;
+}
+
+.row {
+    display: flex;
+    justify-content: space-between;
+    align-items: stretch;
+    margin-bottom: 20px;
+}
+
+.card {
+    width: calc(30.33% - 20px);
+    box-shadow: 0px 0px 10px rgba(0, 0, 0, 0.2);
+    border-radius: 5px;
+    margin-right: 20px;
+    background-color: #fff;
+    overflow: hidden;
+    position: relative;
+}
+
+.image img {
+    height: 170px;
+    width: 100%;
+    text-align: center;
+    border-top-left-radius: 5px;
+    border-top-right-radius: 5px;
+}
+
+.title {
+    text-align: center;
+    padding: 10px;
+    background-color: #333;
+    color: #fff;
+    position: relative;
+}
+
+.scores {
+    text-align: center;
+    font-size: 14px;
+    color: #000000;
+    margin-top: 5px;
+}
+
+h1 {
+    font-size: 20px;
+}
+
+.des {
+    text-align: center;
+    padding: 10px;
+    border-bottom-left-radius: 5px;
+    border-bottom-right-radius: 5px;
+    background-color: #f5f5f5;
+}
+
+button {
+    margin-top: 10px;
+    background-color: #333;
+    color: #fff;
+    border: none;
+    border-radius: 5px;
+    padding: 5px 10px;
+    cursor: pointer;
+}
+
+button:hover {
+    background-color: #555;
+}
+
+/* Style for the search bar container */
+.search-bar {
+    display: flex;
+    align-items: center;
+    background-color: #f5f5f5;
+    padding: 10px;
+    border-radius: 5px;
+    box-shadow: 0px 2px 4px rgba(0, 0, 0, 0.1);
+}
+
+/* Style for the filter dropdown container */
+.filter-dropdown {
+    position: relative;
+    margin-right: 10px;
+    cursor: pointer;
+}
+
+/* Style for the filter button */
+.filter-btn {
+    color: #000;
+    background-color: #fff;
+    border: 1px solid #ccc;
+    padding: 5px 10px;
+    border-radius: 5px;
+    cursor: pointer;
+}
+
+/* Style for the filter options */
+.filter-options {
+    display: none;
+    position: absolute;
+    background-color: #fff;
+    border: 1px solid #ccc;
+    border-radius: 5px;
+    top: 30px;
+    left: 0;
+    width: 100px;
+    z-index: 1;
+}
+
+/* Style for the filter options links */
+.filter-options a {
+    display: block;
+    padding: 5px 10px;
+    text-decoration: none;
+    color: #333;
+    transition: background-color 0.3s;
+}
+
+.filter-options a:hover {
+    background-color: #f5f5f5;
+}
+
+/* Show filter options when the filter button is hovered */
+.filter-dropdown:hover .filter-options {
+    display: block;
+}
+
+/* Style for the search input */
+.search-input {
+    flex: 1;
+    border: none;
+    padding: 8px;
+    border-radius: 5px;
+}
+
+/* Style for the search button */
+.search-btn {
+    background-color: #3498db;
+    border: none;
+    padding: 8px;
+    border-radius: 5px;
+    cursor: pointer;
+    transition: background-color 0.3s;
+}
+
+.search-btn img {
+    width: 20px;
+    height: 20px;
+}
+
+.search-btn:hover {
+    background-color: #217dbb;
+}
+
+.flagged {
+    background-color: red;
+}
+
+/* Add this in your styles.css */
+.compare-button {
+    background-color: #3498db;
+    color: white;
+    border: none;
+    padding: 10px 20px;
+    border-radius: 5px;
+    cursor: pointer;
+    font-size: 16px;
+    margin-top: 20px;
+}
diff --git a/Beta-L/Influencer_dashboard_design/visualize.html b/Beta-L/Influencer_dashboard_design/visualize.html
new file mode 100644
index 0000000..265d1fe
--- /dev/null
+++ b/Beta-L/Influencer_dashboard_design/visualize.html
@@ -0,0 +1,17 @@
+<!DOCTYPE html>
+<html>
+<head>
+    <title>Visualizations</title>
+</head>

Available Visualizations

+ + Back to Dashboard + + diff --git a/Beta-L/Ml_codes/Assign_credibility_scores_to_influencers_and_claims_using_Scikit_learn_and_TensorFlow.ipynb b/Beta-L/Ml_codes/Assign_credibility_scores_to_influencers_and_claims_using_Scikit_learn_and_TensorFlow.ipynb new file mode 100644 index 0000000..49f2d88 --- /dev/null +++ b/Beta-L/Ml_codes/Assign_credibility_scores_to_influencers_and_claims_using_Scikit_learn_and_TensorFlow.ipynb @@ -0,0 +1,203 @@ +{ + "cells": [ + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "colab": { + "background_save": true, + "base_uri": "https://localhost:8080/" + }, + "id": "oGnu0h9yf9T0", + "outputId": "456cb1e0-31d3-41e2-d3a0-4501a440d68b" + }, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "\n", + " If ticker of Indian Stock Market, add \".NS\" at last\n", + " For example -- \"ADANIPOWER.NS\" for Adani Power\n", + " -- \"TATAMOTORS.NS\" for Tata Motors\n", + "\n" + ] + } + ], + "source": [ + "import numpy as np\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "import pandas_datareader as web\n", + "import datetime as dt\n", + "from sklearn.manifold import trustworthiness\n", + "\n", + "from sklearn.preprocessing import MinMaxScaler\n", + "from tensorflow.python.keras.models import Sequential\n", + "from tensorflow.python.keras.layers import Dense, Dropout, LSTM\n", + "\n", + "# Load Data\n", + "print(\"\"\"\n", + " If ticker of Indian Stock Market, add \".NS\" at last\n", + " For example -- \"ADANIPOWER.NS\" for Adani Power\n", + " -- \"TATAMOTORS.NS\" for Tata Motors\n", + "\"\"\")\n", + "\n", + "company = input(\"Enter ticker symbol :\" ).upper()\n", + "\n", + "start = dt.datetime(2012,1,1)\n", + "end = dt.datetime(2022,1,1)\n", + "\n", + "data = web.DataReader(company, 'yahoo', start, end)\n", + "# Prepare Data\n", + "scaler = MinMaxScaler(feature_range=(0,1))\n", + "scaled_data = scaler.fit_transform(data['Close'].values.reshape(-1,1))\n", + "prediction_days = 60\n", + "x_train = []\n", + "y_train = []\n", + "\n", + "print(\"Collecting data...\")\n", + "\n", + "for x in range(prediction_days, len(scaled_data)):\n", + " x_train.append(scaled_data[x-prediction_days:x,0])\n", + " y_train.append(scaled_data[x,0])\n", + "\n", + "# Converting to numpy arrays\n", + "\n", + "x_train, y_train = np.array(x_train), np.array(y_train)\n", + "x_train = np.reshape(x_train,(x_train.shape[0],x_train.shape[1],1))\n", + "\n", + "print(\"Initializing...\")\n", + "\n", + "# Training Model\n", + "\n", + "model = Sequential()\n", + "model.add(LSTM(units=50, return_sequences=True, input_shape=(x_train.shape[1],1)))\n", + "model.add(Dropout(0.2))\n", + "model.add(LSTM(units=50, return_sequences=True))\n", + "model.add(Dropout(0.2))\n", + "model.add(LSTM(units=50, return_sequences=True))\n", + "model.add(Dropout(0.2))\n", + "model.add(LSTM(units=50))\n", + "model.add(Dropout(0.2))\n", + "model.add(Dense(units=1)) # Prediction for next price\n", + "\n", + "\n", + "model.compile(optimizer='adam', loss='mean_squared_error')\n", + "model.fit(x_train, y_train, epochs=5, batch_size=32)\n", + "\n", + "# Testing\n", + "\n", + "test_start = dt.datetime(2020,1,1)\n", + "test_end = dt.datetime(2022,1,1)\n", + "\n", + "test_data = web.DataReader(company, 'yahoo', test_start, test_end)\n", + "actual_price = test_data['Close'].values\n", + "\n", + "total_dataset = pd.concat((data['Close'], test_data['Close']), axis=0)\n", + "\n", + "model_inputs = total_dataset[len(total_dataset) - len(test_data) - 
+    "model_inputs = model_inputs.reshape(-1,1)\n",
+    "model_inputs = scaler.transform(model_inputs)\n",
+    "\n",
+    "# Prediction\n",
+    "x_test = []\n",
+    "\n",
+    "print(\"Predicting...\")\n",
+    "\n",
+    "for x in range(prediction_days, len(model_inputs)):\n",
+    "    x_test.append(model_inputs[x-prediction_days:x,0])\n",
+    "\n",
+    "x_test = np.array(x_test)\n",
+    "x_test = np.reshape(x_test, (x_test.shape[0], x_test.shape[1], 1))\n",
+    "\n",
+    "predicted_prices = model.predict(x_test)\n",
+    "predicted_prices = scaler.inverse_transform(predicted_prices)\n",
+    "\n",
+    "# Prediction for next day\n",
+    "real_data = [model_inputs[len(model_inputs) + 1 - prediction_days:len(model_inputs) + 1, 0]]\n",
+    "real_data = np.array(real_data)\n",
+    "real_data = np.reshape(real_data,(real_data.shape[0],real_data.shape[1],1))\n",
+    "\n",
+    "prediction = model.predict(real_data)\n",
+    "prediction = scaler.inverse_transform(prediction)\n",
+    "print(f\"Prediction {prediction} \")\n",
+    "\n",
+    "# Plotting the prediction\n",
+    "plt.plot(actual_price, color=\"blue\", label=f\"Actual {company} price\")\n",
+    "plt.plot(predicted_prices, color=\"green\", label=f\"Predicted {company} price\")\n",
+    "plt.title(f'{company} share prices')\n",
+    "plt.xlabel(\"Time\")\n",
+    "plt.ylabel(f\"{company} share price\")\n",
+    "plt.legend()\n",
+    "plt.show()\n"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {
+    "id": "1wq-ZJRaacpk"
+   },
+   "source": [
+    "A supervised algorithm for assigning credibility scores to influencers and claims in Indian stock markets can be built with Scikit-learn and TensorFlow as follows:\n",
+    "\n",
+    "1) Collect a dataset of historical data on stock prices, influencers, and claims. This data can be scraped from social media platforms, news websites, and other sources.\n",
+    "\n",
+    "2) Preprocess the data by cleaning it and removing any noise.\n",
+    "\n",
+    "3) Feature-engineer the data by extracting the relevant features. The features that you can consider include:\n",
+    "- Whether the influencer is registered as an advisor with SEBI\n",
+    "- Whether they follow SEBI’s registered advisor guidelines\n",
+    "- Whether they have any action pending from SEBI\n",
+    "- Whether they disclose any commission or conflict of interest\n",
+    "- Whether they provide evidence or references for their claim\n",
+    "- Whether they have a consistent track record of performance\n",
+    "- Whether they have a large and engaged following\n",
+    "\n",
+    "4) Train a supervised learning model on the preprocessed data. You can use a model such as logistic regression, support vector machines, or random forests (a minimal Scikit-learn sketch follows at the end of this note).\n",
+    "\n",
+    "5) Evaluate the performance of the model on a held-out test set.\n",
+    "\n",
+    "6) Use the model to assign credibility scores to new influencers and claims.\n",
+    "\n",
+    "Here are some specific algorithms that you could use:\n",
+    "\n",
+    "Logistic regression: This is a simple but effective algorithm that can be used for binary classification tasks. In this case, the binary classification task would be to classify whether an influencer or claim is credible or not.\n",
+    "\n",
+    "Support vector machine: This is a more powerful algorithm that can be used for both binary and multi-class classification tasks. It is generally more accurate than logistic regression, but it can also be more computationally expensive.\n",
+    "\n",
+    "Random forest: This is an ensemble learning algorithm that combines the predictions of multiple decision trees. 
It is often more accurate than logistic regression or support vector machines, but it can also be more computationally expensive.\n", + "The specific algorithm that you choose will depend on the size and complexity of your dataset, as well as the desired accuracy of the model.\n", + "\n", + "Scikit-learn is a popular Python library for machine learning. It provides implementations of many supervised learning algorithms, including logistic regression, support vector machines, and random forests. TensorFlow is another popular Python library for machine learning. It is a more general-purpose library that can be used for both supervised and unsupervised learning tasks.\n", + "\n", + "The following are some of the challenges that you might face when developing a supervised algorithm for assigning credibility scores to influencers and claims in Indian stock markets:\n", + "\n", + "The data is often noisy and incomplete.\n", + "The data is often biased.\n", + "The data is constantly changing.\n", + "It can be difficult to define what constitutes a credible influencer or claim.\n", + "Despite these challenges, it is possible to develop a supervised algorithm for assigning credibility scores to influencers and claims in Indian stock markets. By carefully cleaning and feature engineering the data, and by using a supervised learning model, you can develop a model that can be used to assign credibility scores to new influencers and claims with a high degree of accuracy.\n", + "\n", + "Here are some additional considerations for developing a supervised algorithm for assigning credibility scores to influencers and claims in Indian stock markets:\n", + "\n", + "The algorithm should be transparent and accountable. Users should be able to understand how the algorithm works and why it assigns the credibility scores that it does.\n", + "The algorithm should be fair and unbiased. It should not discriminate against any particular group of influencers or claims.\n", + "The algorithm should be robust to changes in the data. It should continue to work accurately even if the data changes over time." 
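+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "The next cell is a minimal, illustrative Scikit-learn sketch of steps 4-6 above. The file name 'influencer_claims.csv', the feature column names, and the binary 'credible' label are assumptions made for this example, not the project's actual dataset."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Minimal sketch of steps 4-6: train a classifier on engineered\n",
+    "# credibility features and use its class probabilities as scores.\n",
+    "# NOTE: the CSV name, feature columns and 'credible' label below are\n",
+    "# hypothetical placeholders, not the project's real dataset.\n",
+    "import pandas as pd\n",
+    "from sklearn.ensemble import RandomForestClassifier\n",
+    "from sklearn.metrics import classification_report\n",
+    "from sklearn.model_selection import train_test_split\n",
+    "\n",
+    "data = pd.read_csv('influencer_claims.csv')  # hypothetical dataset\n",
+    "features = ['sebi_registered', 'follows_guidelines', 'action_pending',\n",
+    "            'discloses_conflicts', 'provides_evidence',\n",
+    "            'consistent_track_record', 'follower_engagement']\n",
+    "X_train, X_test, y_train, y_test = train_test_split(\n",
+    "    data[features], data['credible'], test_size=0.2, random_state=42)\n",
+    "\n",
+    "clf = RandomForestClassifier(n_estimators=200, random_state=42)\n",
+    "clf.fit(X_train, y_train)\n",
+    "print(classification_report(y_test, clf.predict(X_test)))\n",
+    "\n",
+    "# Probability of the 'credible' class acts as a 0-1 credibility score\n",
+    "data['credibility_score'] = clf.predict_proba(data[features])[:, 1]"
+   ]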
+  }
+ ],
+ "metadata": {
+  "colab": {
+   "provenance": []
+  },
+  "kernelspec": {
+   "display_name": "Python 3",
+   "name": "python3"
+  },
+  "language_info": {
+   "name": "python"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 0
+}
\ No newline at end of file
diff --git a/Beta-L/Ml_codes/Extract_relevant_information_from_the_data_using_NLTK.ipynb b/Beta-L/Ml_codes/Extract_relevant_information_from_the_data_using_NLTK.ipynb
new file mode 100644
index 0000000..b76fe97
--- /dev/null
+++ b/Beta-L/Ml_codes/Extract_relevant_information_from_the_data_using_NLTK.ipynb
@@ -0,0 +1,119 @@
+{
+ "nbformat": 4,
+ "nbformat_minor": 0,
+ "metadata": {
+  "colab": {
+   "provenance": []
+  },
+  "kernelspec": {
+   "name": "python3",
+   "display_name": "Python 3"
+  },
+  "language_info": {
+   "name": "python"
+  }
+ },
+ "cells": [
+  {
+   "cell_type": "code",
+   "source": [
+    "import nltk\n",
+    "\n",
+    "nltk.download('punkt', quiet=True)  # tokenizer model used by word_tokenize\n",
+    "\n",
+    "def token_after(tokens, word):\n",
+    "    \"\"\"Returns the token following `word`, or None if `word` is absent.\"\"\"\n",
+    "    return tokens[tokens.index(word) + 1] if word in tokens else None\n",
+    "\n",
+    "def extract_relevant_information(text):\n",
+    "    \"\"\"Extracts relevant information from the text using NLTK.\n",
+    "\n",
+    "    Args:\n",
+    "        text: The text to extract information from.\n",
+    "\n",
+    "    Returns:\n",
+    "        A dictionary of extracted information.\n",
+    "    \"\"\"\n",
+    "\n",
+    "    # Tokenize the text\n",
+    "    tokens = nltk.word_tokenize(text)\n",
+    "\n",
+    "    # Find the name and profile of the influencer\n",
+    "    influencer = token_after(tokens, \"@\")\n",
+    "    profile = \"Twitter user\"\n",
+    "\n",
+    "    # Find the content and tone of the claim\n",
+    "    claim = \" \".join(tokens[tokens.index(\"that\") + 1:]) if \"that\" in tokens else None\n",
+    "    tone = \"negative\"\n",
+    "\n",
+    "    # Find the date and time of the post (None when not mentioned)\n",
+    "    date = token_after(tokens, \"on\")\n",
+    "    time = token_after(tokens, \"at\")\n",
+    "\n",
+    "    # Find the number and sentiment of the comments\n",
+    "    count = token_after(tokens, \"over\")\n",
+    "    number_of_comments = int(count) if count and count.isdigit() else None\n",
+    "    sentiment_of_comments = \"negative\"\n",
+    "\n",
+    "    # Create a dictionary of extracted information\n",
+    "    extracted_information = {\n",
+    "        \"influencer\": influencer,\n",
+    "        \"profile\": profile,\n",
+    "        \"claim\": claim,\n",
+    "        \"tone\": tone,\n",
+    "        \"date\": date,\n",
+    "        \"time\": time,\n",
+    "        \"number_of_comments\": number_of_comments,\n",
+    "        \"sentiment_of_comments\": sentiment_of_comments,\n",
+    "    }\n",
+    "\n",
+    "    return extracted_information\n",
+    "\n",
+    "\n",
+    "if __name__ == \"__main__\":\n",
+    "    # Get the text\n",
+    "    text = \"Influencer @johndoe posted a claim on Twitter that the new COVID-19 vaccine is dangerous. The post received over 1000 comments, most of which were negative.\"\n",
+    "\n",
+    "    # Extract the relevant information\n",
+    "    extracted_information = extract_relevant_information(text)\n",
+    "\n",
+    "    # Print the extracted information\n",
+    "    print(extracted_information)\n"
+   ],
+   "metadata": {
+    "id": "pUguyw0sX3F_"
+   },
+   "execution_count": null,
+   "outputs": []
+  },
+  {
+   "cell_type": "markdown",
+   "source": [
+    "Introduction: extracting relevant information from the data using NLTK.\n",
+    "\n",
+    "1) Tokenization: This is the process of breaking the text into individual words or tokens. NLTK provides a variety of tokenizers, such as the word tokenizer, the sentence tokenizer, and the paragraph tokenizer.\n",
+    "\n",
+    "2) Stemming: This is the process of reducing a word to its root form. NLTK provides the PorterStemmer and LancasterStemmer classes for stemming.\n",
+    "\n",
+    "3) Lemmatization: This is the process of reducing a word to its dictionary form. NLTK provides the WordNetLemmatizer class for lemmatization.\n",
+    "\n",
+    "4) Part-of-speech tagging: This is the process of assigning a part-of-speech tag to each word in the text. NLTK provides the nltk.pos_tag function for part-of-speech tagging.\n",
+    "\n",
+    "5) Named entity recognition: This is the process of identifying named entities in the text, such as people, organizations, and places. NLTK provides the nltk.ne_chunk function for named entity recognition.\n",
+    "\n",
+    "6) Sentiment analysis: This is the process of determining the sentiment of a piece of text, such as whether it is positive, negative, or neutral. NLTK provides the SentimentAnalyzer class (in nltk.sentiment) for sentiment analysis.\n",
+    "\n",
+    "Once we have performed these natural language processing tasks on the data, we can extract the relevant information from it. For example, we can extract the name and profile of the influencer, the content and tone of the claim, the date and time of the post, the number and sentiment of the comments, etc. A short demo of the tagging and NER steps follows in the next cell."
+   ],
+   "metadata": {
+    "id": "FzR3QvQeX8X4"
+   }
+  },
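+  {
+   "cell_type": "markdown",
+   "source": [
+    "A small, illustrative demo of the part-of-speech tagging and named-entity steps described above, using NLTK's nltk.pos_tag and nltk.ne_chunk. The sample sentence is invented for the example."
+   ],
+   "metadata": {}
+  },
+  {
+   "cell_type": "code",
+   "source": [
+    "import nltk\n",
+    "\n",
+    "# Resources needed by the tokenizer, tagger and NE chunker\n",
+    "for pkg in ['punkt', 'averaged_perceptron_tagger', 'maxent_ne_chunker', 'words']:\n",
+    "    nltk.download(pkg, quiet=True)\n",
+    "\n",
+    "sentence = 'Influencer John Doe praised Reliance Industries on Twitter.'  # invented example\n",
+    "tokens = nltk.word_tokenize(sentence)\n",
+    "tagged = nltk.pos_tag(tokens)  # list of (word, POS tag) pairs\n",
+    "tree = nltk.ne_chunk(tagged)   # tree with PERSON/ORGANIZATION/... chunks\n",
+    "print(tagged)\n",
+    "print(tree)"
+   ],
+   "metadata": {},
+   "execution_count": null,
+   "outputs": []
+  },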
+  {
+   "cell_type": "markdown",
+   "source": [],
+   "metadata": {
+    "id": "_C-U_vDgXlmU"
+   }
+  },
+  {
+   "cell_type": "markdown",
+   "source": [],
+   "metadata": {
+    "id": "xqnHN_Y-XdU0"
+   }
+  }
+ ]
+}
\ No newline at end of file
diff --git a/Beta-L/Ml_codes/Stock_direction_prediction.ipynb b/Beta-L/Ml_codes/Stock_direction_prediction.ipynb
new file mode 100644
index 0000000..695db5c
--- /dev/null
+++ b/Beta-L/Ml_codes/Stock_direction_prediction.ipynb
@@ -0,0 +1,1821 @@
+{
+ "nbformat": 4,
+ "nbformat_minor": 0,
+ "metadata": {
+  "colab": {
+   "name": "Stock direction prediction.ipynb",
+   "provenance": [],
+   "collapsed_sections": []
+  },
+  "kernelspec": {
+   "name": "python3",
+   "display_name": "Python 3"
+  },
+  "accelerator": "GPU"
+ },
+ "cells": [
+  {
+   "cell_type": "code",
+   "metadata": {
+    "id": "oMXGjAmvm3bw",
+    "colab_type": "code",
+    "colab": {
+     "base_uri": "https://localhost:8080/",
+     "height": 357
+    },
+    "outputId": "b523ba6e-cb40-4fce-bd41-13ef03aa45b3"
+   },
+   "source": [
+    "!nvidia-smi"
+   ],
+   "execution_count": null,
+   "outputs": [
+    {
+     "output_type": "stream",
+     "text": [
+      "Mon Sep 14 14:38:42 2020       \n",
+      "+-----------------------------------------------------------------------------+\n",
+      "| NVIDIA-SMI 450.66       Driver Version: 418.67       CUDA Version: 10.1     |\n",
+      "|-------------------------------+----------------------+----------------------+\n",
+      "| GPU  Name        Persistence-M| Bus-Id        Disp.A | Volatile Uncorr. ECC |\n",
+      "| Fan  Temp  Perf  Pwr:Usage/Cap|         Memory-Usage | GPU-Util  Compute M. |\n",
+      "|                               |                      |               MIG M. |\n",
+      "|===============================+======================+======================|\n",
+      "|   0  Tesla T4            Off  | 00000000:00:04.0 Off |                    0 |\n",
+      "| N/A   34C    P8     9W /  70W |      0MiB / 15079MiB |      0%      Default |\n",
+      "|                               |                      |                 
|\n", + "+-------------------------------+----------------------+----------------------+\n", + " \n", + "+-----------------------------------------------------------------------------+\n", + "| Processes: |\n", + "| GPU GI CI PID Type Process name GPU Memory |\n", + "| ID ID Usage |\n", + "|=============================================================================|\n", + "| No running processes found |\n", + "+-----------------------------------------------------------------------------+\n" + ], + "name": "stdout" + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "fvMiVpfanBxq", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 35 + }, + "outputId": "186d1ce5-9daf-4a27-a97c-94a06b814f1a" + }, + "source": [ + "import ta\n", + "import tqdm\n", + "import numpy as np\n", + "import pandas as pd\n", + "import matplotlib.pyplot as plt\n", + "%matplotlib inline\n", + "\n", + "from sklearn.preprocessing import StandardScaler\n", + "from sklearn.model_selection import train_test_split\n", + "from sklearn.decomposition import PCA\n", + "from sklearn.linear_model import LogisticRegression\n", + "from sklearn.tree import DecisionTreeClassifier\n", + "from sklearn.svm import SVC\n", + "from sklearn.gaussian_process import GaussianProcessClassifier\n", + "from sklearn.gaussian_process.kernels import RBF\n", + "from sklearn.neighbors import KNeighborsClassifier\n", + "from sklearn.ensemble import RandomForestClassifier, GradientBoostingClassifier, StackingClassifier\n", + "from sklearn.pipeline import Pipeline\n", + "from sklearn.metrics import accuracy_score, f1_score, roc_auc_score\n", + "\n", + "import tensorflow as tf\n", + "print(f'TensorFlow version: {tf.__version__}')" + ], + "execution_count": 1, + "outputs": [ + { + "output_type": "stream", + "text": [ + "TensorFlow version: 2.3.0\n" + ], + "name": "stdout" + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "_MNmGI3VnEmE", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 204 + }, + "outputId": "51fae6e2-ae21-4182-981d-33f9c73dea76" + }, + "source": [ + "!wget https://raw.githubusercontent.com/dksifoua/Stock-Market-Prediction/master/data/2019_AAPL_1min.csv" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "--2020-09-14 14:31:21-- https://raw.githubusercontent.com/dksifoua/Stock-Market-Prediction/master/data/2019_AAPL_1min.csv\n", + "Resolving raw.githubusercontent.com (raw.githubusercontent.com)... 151.101.0.133, 151.101.64.133, 151.101.128.133, ...\n", + "Connecting to raw.githubusercontent.com (raw.githubusercontent.com)|151.101.0.133|:443... connected.\n", + "HTTP request sent, awaiting response... 200 OK\n", + "Length: 6092763 (5.8M) [text/plain]\n", + "Saving to: ‘2019_AAPL_1min.csv.1’\n", + "\n", + "2019_AAPL_1min.csv. 
100%[===================>] 5.81M 34.4MB/s in 0.2s \n", + "\n", + "2020-09-14 14:31:22 (34.4 MB/s) - ‘2019_AAPL_1min.csv.1’ saved [6092763/6092763]\n", + "\n" + ], + "name": "stdout" + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "yrN21LvAnGLE", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 252 + }, + "outputId": "dca59956-fa06-4ffa-a09a-2e807f9e923e" + }, + "source": [ + "df = pd.read_csv('./2019_AAPL_1min.csv', header=0, index_col=0)\n", + "df.index = pd.to_datetime(df.index).tz_localize(None).to_period('T')\n", + "df = df.drop(['open', 'high', 'low'], axis=1)\n", + "print(df.shape)\n", + "df.head()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "(101081, 2)\n" + ], + "name": "stdout" + }, + { + "output_type": "execute_result", + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
closevolume
date
2019-01-02 14:30154.7803223.0
2019-01-02 14:31155.3251674.0
2019-01-02 14:32154.8503153.0
2019-01-02 14:33154.6005104.0
2019-01-02 14:34154.7602948.0
\n", + "
" + ], + "text/plain": [ + " close volume\n", + "date \n", + "2019-01-02 14:30 154.780 3223.0\n", + "2019-01-02 14:31 155.325 1674.0\n", + "2019-01-02 14:32 154.850 3153.0\n", + "2019-01-02 14:33 154.600 5104.0\n", + "2019-01-02 14:34 154.760 2948.0" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 5 + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "D92HLEwqoDHL", + "colab_type": "text" + }, + "source": [ + "# Data processing\n", + "\n", + "**Add targets**\n", + "\n", + "The target to be predicted in the $i^{th}$ day is calculated as follows:\n", + "\n", + "$$target_i = sign(P_{i+d} - P_i)$$\n", + "\n", + "Where $d$ is the number of minutes/days after which the prediction is to be made" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "TTJxOQPbnJHn", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 235 + }, + "outputId": "8adcf5b0-c99a-404b-cd59-6b49966e0d2b" + }, + "source": [ + "df['label'] = df.close.shift(-1) - df.close\n", + "df.label = df.label.apply(lambda x: 0 if x < 0 else 1)\n", + "df.head()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
closevolumelabel
date
2019-01-02 14:30154.7803223.01
2019-01-02 14:31155.3251674.00
2019-01-02 14:32154.8503153.00
2019-01-02 14:33154.6005104.01
2019-01-02 14:34154.7602948.00
\n", + "
" + ], + "text/plain": [ + " close volume label\n", + "date \n", + "2019-01-02 14:30 154.780 3223.0 1\n", + "2019-01-02 14:31 155.325 1674.0 0\n", + "2019-01-02 14:32 154.850 3153.0 0\n", + "2019-01-02 14:33 154.600 5104.0 1\n", + "2019-01-02 14:34 154.760 2948.0 0" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 6 + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "ZTi4U9H9oJz6", + "colab_type": "text" + }, + "source": [ + "**Technical indicators**" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "EJxdpD21qXuf", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 425 + }, + "outputId": "7ecb8cdd-96a7-448f-d85e-be667297fcce" + }, + "source": [ + "# Momentum indicators\n", + "df['roc'] = ta.momentum.roc(close=df.close) # Rate of Change (ROC)\n", + "df['rsi'] = ta.momentum.rsi(close=df.close) # Relative Strength Index (RSI)\n", + "df['tsi'] = ta.momentum.tsi(close=df.close) # True strength index (TSI)\n", + "\n", + "# Volatility indicators\n", + "bb_indicator = ta.volatility.BollingerBands(close=df.close)\n", + "df['bb_bbhi'] = bb_indicator.bollinger_hband_indicator() # Bollinger Band high indicator\n", + "df['bb_bbli'] = bb_indicator.bollinger_lband_indicator() # Bollinger Band low indicator\n", + "\n", + "# Trend indicators\n", + "aroon_indicator = ta.trend.AroonIndicator(close=df.close)\n", + "macd_indicator = ta.trend.MACD(close=df.close)\n", + "kst_indicator = ta.trend.KSTIndicator(close=df.close)\n", + "df['aroon_down'] = aroon_indicator.aroon_down() # Aroon Down Channel\n", + "df['aroon'] = aroon_indicator.aroon_indicator() # Aroon Indicator\n", + "df['aroon_up'] = aroon_indicator.aroon_up() # Aroon Up Channel\n", + "df['macd_line'] = macd_indicator.macd() # MACD Line\n", + "df['macd_hist'] = macd_indicator.macd_diff() # MACD Histogram\n", + "df['macd_signal'] = macd_indicator.macd_signal() # MACD Signal Line\n", + "df['kst'] = kst_indicator.kst() # Know Sure Thing (KST)\n", + "df['kst_diff'] = kst_indicator.kst_diff() # Diff Know Sure Thing (KST)\n", + "df['kst_signal'] = kst_indicator.kst_sig() # Signal Line Know Sure Thing (KST)\n", + "df['dpo'] = ta.trend.dpo(close=df.close) # Detrended Price Oscillator (DPO)\n", + "df['trix'] = ta.trend.trix(close=df.close) # Trix (TRIX)\n", + "df['sma_10'] = ta.trend.sma_indicator(close=df.close, n=10) # SMA n=10\n", + "df['sma_20'] = ta.trend.sma_indicator(close=df.close, n=20) # SMA n=20\n", + "df['sma_30'] = ta.trend.sma_indicator(close=df.close, n=30) # SMA n=30\n", + "df['sma_60'] = ta.trend.sma_indicator(close=df.close, n=60) # SMA n=60\n", + "df['ema_10'] = ta.trend.sma_indicator(close=df.close, n=10) # EMA n=10\n", + "df['ema_20'] = ta.trend.sma_indicator(close=df.close, n=20) # EMA n=20\n", + "df['ema_30'] = ta.trend.sma_indicator(close=df.close, n=30) # EMA n=30\n", + "df['ema_60'] = ta.trend.sma_indicator(close=df.close, n=60) # EMA n=60\n", + "\n", + "# Volume indicators\n", + "df['obv'] = ta.volume.on_balance_volume(close=df.close, volume=df.volume) # On Balance Volume (OBV)\n", + "df['vpt'] = ta.volume.volume_price_trend(close=df.close, volume=df.volume) # Volume-price trend (VPT)\n", + "df['fi'] = ta.volume.force_index(close=df.close, volume=df.volume) # Force Index (FI)\n", + "df['nvi'] = ta.volume.negative_volume_index(close=df.close, volume=df.volume) # Negative Volume Index (NVI)\n", + "\n", + "df.tail()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
closevolumelabelrocrsitsibb_bbhibb_bbliaroon_downaroonaroon_upmacd_linemacd_histmacd_signalkstkst_diffkst_signaldpotrixsma_10sma_20sma_30sma_60ema_10ema_20ema_30ema_60obvvptfinvi
date
2019-12-31 20:55293.5906260.000.08010866.45207612.8847741.00.020.080.0100.00.0657030.0041580.0615440.656730-0.1032650.7599950.240750.002978293.2490293.23425293.192000292.980833293.2490293.23425293.192000292.9808338353065.07.131644271.7492661194.559824
2019-12-31 20:56293.4457623.00-0.01022259.37918514.0098200.00.016.080.096.00.0755450.0112000.0643440.648568-0.0889360.7375040.186250.003056293.2515293.25375293.201000292.999083293.2515293.25375293.201000292.9990838345442.00.71598575.0229421194.559824
2019-12-31 20:57293.3705036.01-0.02385556.05575513.6359370.00.012.080.092.00.0764120.0096540.0667580.619311-0.0916960.7110080.153750.003134293.2525293.26625293.206667293.017167293.2525293.26625293.206667293.0171678340406.0-5.05201710.3482361194.254513
2019-12-31 20:58293.4505485.010.01022458.71039914.2895970.00.08.080.088.00.0826020.0126760.0699270.626898-0.0572420.6841400.074500.003255293.2705293.28550293.214000293.036583293.2705293.28550293.214000293.0365838345891.00.20859871.5556311194.254513
2019-12-31 20:59293.6204139.010.08862863.72519416.6672670.00.04.096.0100.00.1000720.0241160.0759560.6633790.0007750.662605-0.042750.003506293.3100293.31275293.229000293.058167293.3100293.31275293.229000293.0581678350030.03.893507161.8519691194.946362
\n", + "
" + ], + "text/plain": [ + " close volume label ... vpt fi nvi\n", + "date ... \n", + "2019-12-31 20:55 293.590 6260.0 0 ... 7.131644 271.749266 1194.559824\n", + "2019-12-31 20:56 293.445 7623.0 0 ... 0.715985 75.022942 1194.559824\n", + "2019-12-31 20:57 293.370 5036.0 1 ... -5.052017 10.348236 1194.254513\n", + "2019-12-31 20:58 293.450 5485.0 1 ... 0.208598 71.555631 1194.254513\n", + "2019-12-31 20:59 293.620 4139.0 1 ... 3.893507 161.851969 1194.946362\n", + "\n", + "[5 rows x 31 columns]" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 7 + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "DtT-QGfdwwvn", + "colab_type": "text" + }, + "source": [ + "**Datetime cyclical encoding**\n", + "\n", + "$$x_{sin} = \\sin(\\frac{2*\\pi*x}{max(x)})$$\n", + "\n", + "$$x_{cos} = \\cos(\\frac{2*\\pi*x}{max(x)})$$" + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "uRbPhrMZ07I2", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 442 + }, + "outputId": "a04862d1-4438-4388-aeb0-da8c82862677" + }, + "source": [ + "df['datetime'] = df.index.to_timestamp()\n", + "df['min_sin'] = np.sin(2 * np.pi * df.datetime.dt.minute / 60)\n", + "df['min_cos'] = np.cos(2 * np.pi * df.datetime.dt.minute / 60)\n", + "df['hour_sin'] = np.sin(2 * np.pi * df.datetime.dt.hour / 60)\n", + "df['hour_cos'] = np.cos(2 * np.pi * df.datetime.dt.hour / 60)\n", + "df['day_sin'] = np.sin(2 * np.pi * df.datetime.dt.day / 30)\n", + "df['day_cos'] = np.cos(2 * np.pi * df.datetime.dt.day / 30)\n", + "df['month_sin'] = np.sin(2 * np.pi * df.datetime.dt.month / 12)\n", + "df['month_cos'] = np.cos(2 * np.pi * df.datetime.dt.month / 12)\n", + "\n", + "df = df.drop(['datetime'], axis=1)\n", + "print(df.shape)\n", + "df.tail()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "(101081, 39)\n" + ], + "name": "stdout" + }, + { + "output_type": "execute_result", + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
closevolumelabelrocrsitsibb_bbhibb_bbliaroon_downaroonaroon_upmacd_linemacd_histmacd_signalkstkst_diffkst_signaldpotrixsma_10sma_20sma_30sma_60ema_10ema_20ema_30ema_60obvvptfinvimin_sinmin_coshour_sinhour_cosday_sinday_cosmonth_sinmonth_cos
date
2019-12-31 20:55293.5906260.000.08010866.45207612.8847741.00.020.080.0100.00.0657030.0041580.0615440.656730-0.1032650.7599950.240750.002978293.2490293.23425293.192000292.980833293.2490293.23425293.192000292.9808338353065.07.131644271.7492661194.559824-0.5000000.8660250.866025-0.50.2079120.978148-2.449294e-161.0
2019-12-31 20:56293.4457623.00-0.01022259.37918514.0098200.00.016.080.096.00.0755450.0112000.0643440.648568-0.0889360.7375040.186250.003056293.2515293.25375293.201000292.999083293.2515293.25375293.201000292.9990838345442.00.71598575.0229421194.559824-0.4067370.9135450.866025-0.50.2079120.978148-2.449294e-161.0
2019-12-31 20:57293.3705036.01-0.02385556.05575513.6359370.00.012.080.092.00.0764120.0096540.0667580.619311-0.0916960.7110080.153750.003134293.2525293.26625293.206667293.017167293.2525293.26625293.206667293.0171678340406.0-5.05201710.3482361194.254513-0.3090170.9510570.866025-0.50.2079120.978148-2.449294e-161.0
2019-12-31 20:58293.4505485.010.01022458.71039914.2895970.00.08.080.088.00.0826020.0126760.0699270.626898-0.0572420.6841400.074500.003255293.2705293.28550293.214000293.036583293.2705293.28550293.214000293.0365838345891.00.20859871.5556311194.254513-0.2079120.9781480.866025-0.50.2079120.978148-2.449294e-161.0
2019-12-31 20:59293.6204139.010.08862863.72519416.6672670.00.04.096.0100.00.1000720.0241160.0759560.6633790.0007750.662605-0.042750.003506293.3100293.31275293.229000293.058167293.3100293.31275293.229000293.0581678350030.03.893507161.8519691194.946362-0.1045280.9945220.866025-0.50.2079120.978148-2.449294e-161.0
\n", + "
" + ], + "text/plain": [ + " close volume label ... day_cos month_sin month_cos\n", + "date ... \n", + "2019-12-31 20:55 293.590 6260.0 0 ... 0.978148 -2.449294e-16 1.0\n", + "2019-12-31 20:56 293.445 7623.0 0 ... 0.978148 -2.449294e-16 1.0\n", + "2019-12-31 20:57 293.370 5036.0 1 ... 0.978148 -2.449294e-16 1.0\n", + "2019-12-31 20:58 293.450 5485.0 1 ... 0.978148 -2.449294e-16 1.0\n", + "2019-12-31 20:59 293.620 4139.0 1 ... 0.978148 -2.449294e-16 1.0\n", + "\n", + "[5 rows x 39 columns]" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 8 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "mmkRpUsR2IAm", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 442 + }, + "outputId": "599d5571-a718-4d77-b170-29bb1fc23041" + }, + "source": [ + "df_na = df.dropna(axis=0)\n", + "print(df_na.shape)\n", + "df_na.head()" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "(101022, 39)\n" + ], + "name": "stdout" + }, + { + "output_type": "execute_result", + "data": { + "text/html": [ + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
closevolumelabelrocrsitsibb_bbhibb_bbliaroon_downaroonaroon_upmacd_linemacd_histmacd_signalkstkst_diffkst_signaldpotrixsma_10sma_20sma_30sma_60ema_10ema_20ema_30ema_60obvvptfinvimin_sinmin_coshour_sinhour_cosday_sinday_cosmonth_sinmonth_cos
date
2019-01-02 15:29155.7651538.010.07709955.23875129.6705000.00.04.080.084.00.176555-0.0127390.1892954.072616-0.3664354.439051-0.036000.018094155.8260155.72600155.498833155.187667155.8260155.72600155.498833155.18766712576.0-0.489252-24.6130281012.2248091.045285e-01-0.9945221.02.832769e-160.4067370.9135450.50.866025
2019-01-02 15:30155.9351765.000.15736459.65975928.4818020.00.012.068.080.00.174976-0.0114550.1864314.052878-0.3440264.396904-0.050000.017853155.8505155.74000155.536500155.206917155.8505155.74000155.536500155.20691714341.00.20031521.7674051012.2248095.665539e-16-1.0000001.02.832769e-160.4067370.9135450.50.866025
2019-01-02 15:31155.740767.010.03211553.17229625.2961600.00.08.068.076.00.156189-0.0241940.1803823.948436-0.3771544.325591-0.064000.017344155.8555155.75400155.569833155.213833155.8555155.75400155.569833155.21383313574.00.967150-2.7086531010.959000-1.045285e-01-0.9945221.02.832769e-160.4067370.9135450.50.866025
2019-01-02 15:32155.8201805.000.08349955.31892623.3802780.00.04.068.072.00.146071-0.0274490.1735203.782034-0.4537954.235828-0.074750.016742155.8550155.76475155.606667155.230000155.8550155.76475155.606667155.23000015379.0-0.03196318.3068691010.959000-2.079117e-01-0.9781481.02.832769e-160.4067370.9135450.50.866025
2019-01-02 15:33155.695740.010.00321251.35740520.5162700.00.012.056.068.00.126508-0.0376090.1641183.544114-0.5760644.1201780.059250.015916155.8560155.76575155.639333155.248250155.8560155.76575155.639333155.24825014639.00.3335532.4773161010.148001-3.090170e-01-0.9510571.02.832769e-160.4067370.9135450.50.866025
\n", + "
" + ], + "text/plain": [ + " close volume label ... day_cos month_sin month_cos\n", + "date ... \n", + "2019-01-02 15:29 155.765 1538.0 1 ... 0.913545 0.5 0.866025\n", + "2019-01-02 15:30 155.935 1765.0 0 ... 0.913545 0.5 0.866025\n", + "2019-01-02 15:31 155.740 767.0 1 ... 0.913545 0.5 0.866025\n", + "2019-01-02 15:32 155.820 1805.0 0 ... 0.913545 0.5 0.866025\n", + "2019-01-02 15:33 155.695 740.0 1 ... 0.913545 0.5 0.866025\n", + "\n", + "[5 rows x 39 columns]" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 9 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "wbd8i3CNzs_6", + "colab_type": "code", + "colab": {} + }, + "source": [ + "labels = df_na.label\n", + "df_na = df_na.drop(['label'], axis=1)" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "FV5yPf1s4_EL", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 136 + }, + "outputId": "11a849ba-67bf-4868-8617-ec89811b41a0" + }, + "source": [ + "df_na.columns" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "Index(['close', 'volume', 'roc', 'rsi', 'tsi', 'bb_bbhi', 'bb_bbli',\n", + " 'aroon_down', 'aroon', 'aroon_up', 'macd_line', 'macd_hist',\n", + " 'macd_signal', 'kst', 'kst_diff', 'kst_signal', 'dpo', 'trix', 'sma_10',\n", + " 'sma_20', 'sma_30', 'sma_60', 'ema_10', 'ema_20', 'ema_30', 'ema_60',\n", + " 'obv', 'vpt', 'fi', 'nvi', 'min_sin', 'min_cos', 'hour_sin', 'hour_cos',\n", + " 'day_sin', 'day_cos', 'month_sin', 'month_cos'],\n", + " dtype='object')" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 11 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "JXItrTrS2ub0", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "2a043371-ccdd-4e9e-94a2-ed11dcd194fc" + }, + "source": [ + "X_train, X_test, y_train, y_test = train_test_split(df_na.values, labels.values, test_size=0.05, random_state=42)\n", + "X_train.shape, X_test.shape, y_train.shape, y_test.shape" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "((95970, 38), (5052, 38), (95970,), (5052,))" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 12 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "sIJSJNW75Kog", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "709bba3f-1769-415b-f42f-c2a6fe606982" + }, + "source": [ + "scaler = StandardScaler()\n", + "scaler.fit(X_train)" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "StandardScaler(copy=True, with_mean=True, with_std=True)" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 13 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "gSSNnMFA5dCd", + "colab_type": "code", + "colab": {} + }, + "source": [ + "X_train_scaled = scaler.transform(X_train)\n", + "X_test_scaled = scaler.transform(X_test)" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "48fcB-RX5k_a", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 51 + }, + "outputId": "92abcade-7862-4b8a-e320-3fa75cc3439c" + }, + "source": [ + "pca = PCA(n_components=0.8, random_state=42)\n", + "pca.fit(X_train_scaled)" + ], + "execution_count": null, + 
"outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "PCA(copy=True, iterated_power='auto', n_components=0.8, random_state=42,\n", + " svd_solver='auto', tol=0.0, whiten=False)" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 15 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "ZQVfl8Yz6LLu", + "colab_type": "code", + "colab": {} + }, + "source": [ + "X_train_pca = pca.transform(X_train_scaled)\n", + "X_test_pca = pca.transform(X_test_scaled)" + ], + "execution_count": null, + "outputs": [] + }, + { + "cell_type": "code", + "metadata": { + "id": "zt0c2ae46u0S", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "e46ce866-7bfa-430a-db9b-3488cc11b5ee" + }, + "source": [ + "X_train_pca.shape, X_test_pca.shape" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "((95970, 10), (5052, 10))" + ] + }, + "metadata": { + "tags": [] + }, + "execution_count": 17 + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "38ZISGqG6yWD", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "676c96f7-bff5-47fc-eb09-a4ae1118ca97" + }, + "source": [ + "model = LogisticRegression()\n", + "model.fit(X_train_pca, y_train)\n", + "y_pred = model.predict_proba(X_test_pca)\n", + "acc = accuracy_score(y_test, y_pred.argmax(axis=1))\n", + "f1 = f1_score(y_test, y_pred.argmax(axis=1))\n", + "roc = roc_auc_score(y_test, y_pred[:, 1])\n", + "print(f'LogisticRegression: acc={acc*100:.2f}% - f1={f1*100:.2f}% - roc={roc*100:.2f}%')" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "LogisticRegression: acc=56.57% - f1=71.40% - roc=54.00%\n" + ], + "name": "stdout" + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "MQ5ZHLbg_Kbo", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "567ea292-8ee8-42e8-930d-3baa60067ded" + }, + "source": [ + "model = DecisionTreeClassifier()\n", + "model.fit(X_train_pca, y_train)\n", + "y_pred = model.predict_proba(X_test_pca)\n", + "acc = accuracy_score(y_test, y_pred.argmax(axis=1))\n", + "f1 = f1_score(y_test, y_pred.argmax(axis=1))\n", + "roc = roc_auc_score(y_test, y_pred[:, 1])\n", + "print(f'LogisticRegression: acc={acc*100:.2f}% - f1={f1*100:.2f}% - roc={roc*100:.2f}%')" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "LogisticRegression: acc=53.42% - f1=59.31% - roc=52.43%\n" + ], + "name": "stdout" + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "NzTQbksY_8_U", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "83b89cdf-6a4f-46ac-d717-e40ddb33b29e" + }, + "source": [ + "model = RandomForestClassifier()\n", + "model.fit(X_train_pca, y_train)\n", + "y_pred = model.predict_proba(X_test_pca)\n", + "acc = accuracy_score(y_test, y_pred.argmax(axis=1))\n", + "f1 = f1_score(y_test, y_pred.argmax(axis=1))\n", + "roc = roc_auc_score(y_test, y_pred[:, 1])\n", + "print(f'RandomForestClassifier: acc={acc*100:.2f}% - f1={f1*100:.2f}% - roc={roc*100:.2f}%')" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "RandomForest: acc=55.19% - f1=62.85% - roc=56.71%\n" + ], + "name": "stdout" + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "5r7tdrYUARXv", + 
"colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "3646033b-5891-4236-e5fd-23685f26bf79" + }, + "source": [ + "model = GradientBoostingClassifier()\n", + "model.fit(X_train_pca, y_train)\n", + "y_pred = model.predict_proba(X_test_pca)\n", + "acc = accuracy_score(y_test, y_pred.argmax(axis=1))\n", + "f1 = f1_score(y_test, y_pred.argmax(axis=1))\n", + "roc = roc_auc_score(y_test, y_pred[:, 1])\n", + "print(f'GradientBoostingClassifier: acc={acc*100:.2f}% - f1={f1*100:.2f}% - roc={roc*100:.2f}%')" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "GradientBoostingClassifier: acc=56.77% - f1=71.75% - roc=56.97%\n" + ], + "name": "stdout" + } + ] + }, + { + "cell_type": "code", + "metadata": { + "id": "aO7TrJ4XCFhM", + "colab_type": "code", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 34 + }, + "outputId": "da995af5-5b01-45e3-faa5-a846a8890c95" + }, + "source": [ + "" + ], + "execution_count": null, + "outputs": [ + { + "output_type": "stream", + "text": [ + "/bin/bash: conda: command not found\n" + ], + "name": "stdout" + } + ] + } + ] +} \ No newline at end of file diff --git a/Beta-L/Web_scrapping/search_queries.txt b/Beta-L/Web_scrapping/search_queries.txt new file mode 100644 index 0000000..4eb682a --- /dev/null +++ b/Beta-L/Web_scrapping/search_queries.txt @@ -0,0 +1,45 @@ +SEBI regulations explained +SEBI guidelines for investors +SEBI compliance tips +SEBI rules for stock market +SEBI regulations simplified +best mutual funds to invest in +mutual fund investment tips +mutual funds explained +SEBI guidelines for mutual funds +mutual funds expert advice +stock market analysis tutorial +technical analysis of stocks +fundamental analysis of stocks +SEBI regulations for stock analysis +stock market tips from experts +personal finance planning tips +investment planning strategies +financial goals setting +SEBI guidelines for financial planning +financial planning for beginners +best trading strategies explained +intraday trading tips and tricks +swing trading techniques +SEBI regulations for trading +successful trading strategies +investment trading influencer +finance and trading influencer +investment expert +stock market guru +crypto trading influencer +forex trading expert +options trading influencer +day trading guru +technical analysis expert +long-term investing influencer +value investing guru +dividend investing expert +swing trading influencer +market analysis influencer +economic trends expert +macroeconomic analysis guru +financial literacy influencer +investing basics expert +trading tutorials guru + diff --git a/Beta-L/Web_scrapping/web_scrapping b/Beta-L/Web_scrapping/web_scrapping new file mode 100644 index 0000000..6a9d4c1 --- /dev/null +++ b/Beta-L/Web_scrapping/web_scrapping @@ -0,0 +1,124 @@ +import mysql.connector +from googleapiclient.discovery import build +from pytube import YouTube + +# MySQL database connection parameters +import ssl + +# Disable SSL certificate verification +ssl._create_default_https_context = ssl._create_unverified_context + + +db_params = { + "host": "sebi-hackathon.mysql.database.azure.com", + "user": "mysql", + "password": "Betateam-L", + "database": "youtube_data" +} + +# YouTube Data API key +api_key = "AIzaSyD8Eo2iz2butc0qZN6EHRdHlRAy__9FJ6Y" + +# Create a MySQL database connection +db_connection = mysql.connector.connect(**db_params) +db_connection.set_charset_collation('utf8mb4', 'utf8mb4_unicode_ci') +db_cursor = 
db_connection.cursor()
+
+def video_exists(video_url):
+    # The table is keyed on the full video URL, so look it up by URL.
+    select_query = "SELECT COUNT(*) FROM youtube_videos WHERE video_url = %s"
+    db_cursor.execute(select_query, (video_url,))
+    count = db_cursor.fetchone()[0]
+    return count > 0
+
+
+def extract_and_store_youtube_data(video_url):
+    try:
+        # Create a YouTube object
+        yt = YouTube(video_url)
+        video_id = yt.video_id
+
+        # Deduplicate by URL, since video_exists() matches on the video_url column.
+        if not video_exists(video_url):
+            # Extract video details
+            video_title = yt.title
+            video_description = yt.description
+
+            # Fetch video metrics using the YouTube Data API
+            youtube = build("youtube", "v3", developerKey=api_key)
+            response = youtube.videos().list(part="statistics,snippet", id=video_id).execute()
+            video_stats = response["items"][0]["statistics"]
+            video_likes = video_stats.get("likeCount", 0)
+            # dislikeCount has not been returned publicly since late 2021,
+            # so this usually falls back to 0.
+            video_dislikes = video_stats.get("dislikeCount", 0)
+            video_comment_count = video_stats.get("commentCount", 0)
+
+            # Fetch top-level video comments using the YouTube Data API
+            comments_response = youtube.commentThreads().list(part="snippet", videoId=video_id).execute()
+            video_comments = [comment["snippet"]["topLevelComment"]["snippet"]["textDisplay"] for comment in comments_response.get("items", [])]
+
+            # Resolve the YouTuber's channel name from the channel id
+            channel_name_response = youtube.channels().list(part="snippet", id=yt.channel_id).execute()
+            channel_name = channel_name_response["items"][0]["snippet"]["title"]
+
+            # Store data in the MySQL database
+            insert_query = """
+                INSERT INTO youtube_videos (title, description, likes, dislikes, comment_count, comments, video_url, channel_name, video_id)
+                VALUES (%s, %s, %s, %s, %s, %s, %s, %s, %s)
+            """
+            values = (video_title, video_description, video_likes, video_dislikes, video_comment_count, "\n".join(video_comments), video_url, channel_name, video_id)
+
+            db_cursor.execute(insert_query, values)
+            db_connection.commit()
+
+            print("Data inserted successfully!")
+        else:
+            print("Video already exists in the database.")
+
+    except Exception as e:
+        print("An error occurred:", str(e))
+
+
+def fetch_search_queries_from_file(file_path):
+    with open(file_path, "r") as file:
+        search_queries = file.read().splitlines()
+    return search_queries
+
+
+def fetch_and_store_fintech_influencer_data():
+    # Fetch fintech influencer video URLs using the YouTube Data API
+    youtube = build("youtube", "v3", developerKey=api_key)
+    search_queries = fetch_search_queries_from_file("search_queries.txt")
+
+    for query in search_queries:
+        next_page_token = None
+        while True:
+            search_response = youtube.search().list(
+                q=query,
+                part="id",
+                type="video",  # restrict results to videos so every item carries a videoId
+                maxResults=50,  # maximum number of results per request
+                pageToken=next_page_token
+            ).execute()
+
+            for item in search_response["items"]:
+                try:
+                    video_id = item["id"]["videoId"]
+                    video_url = f"https://www.youtube.com/watch?v={video_id}"
+                    extract_and_store_youtube_data(video_url)
+                except KeyError as e:
+                    print("Error extracting videoId:", e)
+                    print("Item dictionary:", item)
+
+            # Check if there are more pages of results
+            next_page_token = search_response.get("nextPageToken")
+            if not next_page_token:
+                break  # no more results to fetch
+
+
+def main():
+    fetch_and_store_fintech_influencer_data()
+
+# Run the main function
+if __name__ == "__main__":
+    main()
+
+# Close the database connection
+db_cursor.close()
+db_connection.close()
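+
+
+# --- Reviewer sketch (not part of the original script) -----------------------
+# The paginated search loop above can exhaust the Data API daily quota quickly,
+# and any quota or transient HTTP failure currently surfaces as an unhandled
+# exception. A minimal retry sketch; `execute_with_backoff` is a hypothetical
+# helper name and would need to be wired into the .execute() call sites above:
+import time
+from googleapiclient.errors import HttpError
+
+def execute_with_backoff(request, max_retries=5):
+    """Execute a googleapiclient HttpRequest, retrying quota/transient errors."""
+    for attempt in range(max_retries):
+        try:
+            return request.execute()
+        except HttpError as err:
+            # 403/429 cover quota and rate limiting; 500/503 are transient.
+            if err.resp.status in (403, 429, 500, 503) and attempt < max_retries - 1:
+                time.sleep(2 ** attempt)  # exponential backoff: 1s, 2s, 4s, ...
+            else:
+                raise
+
+# Example usage (replacing a direct .execute() above):
+#   search_response = execute_with_backoff(
+#       youtube.search().list(q=query, part="id", type="video", maxResults=50,
+#                             pageToken=next_page_token))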