From c14791f30959c1dc0eb2cfa389ef6126599d98d0 Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Thu, 13 Nov 2025 17:54:13 +0000
Subject: [PATCH 1/2] Reorganize and enhance repository with modular
 architecture

This comprehensive reorganization transforms the project from a single
monolithic script into a professional, production-ready package.

Major Changes:
- Created modular package structure under src/sentiment_analysis/
- Separated concerns into dedicated modules:
  * config.py - Configuration management
  * data_loader.py - Data loading and preprocessing
  * model.py - LSTM model architecture with variants
  * train.py - Training logic with callbacks
  * predict.py - Prediction logic with batch support
  * utils.py - Utility functions and helpers
  * visualization.py - Comprehensive plotting functions
  * cli.py - Command-line interface

New Features:
- CLI tools (sentiment-train, sentiment-predict)
- Python API for programmatic access
- Comprehensive unit tests with pytest
- Multiple usage examples (basic, custom, interactive)
- Jupyter notebook tutorial
- Model persistence (save/load)
- Training callbacks (early stopping, checkpointing, LR reduction)
- Rich visualizations (training curves, confusion matrix, ROC)
- Configuration management system
- Logging throughout

Documentation:
- Complete README rewrite with detailed usage instructions
- CONTRIBUTING.md with development guidelines
- Comprehensive docstrings in all modules
- Example scripts demonstrating various use cases

Infrastructure:
- setup.py for pip installation
- requirements.txt with all dependencies
- pytest.ini for test configuration
- Updated .gitignore for project structure

The old monolithic script is preserved as examples/legacy_monolithic_script.py
for reference.
---
 .gitignore                                    |  35 ++
 CONTRIBUTING.md                               | 331 ++++++++++++++++
 README.md                                     | 228 ++++++-----
 examples/basic_usage.py                       |  78 ++++
 examples/custom_training.py                   |  71 ++++
 .../legacy_monolithic_script.py               |   0
 examples/prediction_only.py                   |  73 ++++
 notebooks/sentiment_analysis_tutorial.ipynb   | 360 ++++++++++++++++++
 pytest.ini                                    |  31 ++
 requirements.txt                              |  24 ++
 setup.py                                      |  80 ++++
 src/sentiment_analysis/__init__.py            |  14 +
 src/sentiment_analysis/__main__.py            |   8 +
 src/sentiment_analysis/cli.py                 | 279 ++++++++++++++
 src/sentiment_analysis/config.py              |  57 +++
 src/sentiment_analysis/data_loader.py         | 157 ++++++++
 src/sentiment_analysis/model.py               | 190 +++++++++
 src/sentiment_analysis/predict.py             | 190 +++++++++
 src/sentiment_analysis/train.py               | 198 ++++++++++
 src/sentiment_analysis/utils.py               | 207 ++++++++++
 src/sentiment_analysis/visualization.py       | 241 ++++++++++++
 tests/__init__.py                             |   1 +
 tests/conftest.py                             |  26 ++
 tests/test_config.py                          |  44 +++
 tests/test_data_loader.py                     |  54 +++
 tests/test_model.py                           |  73 ++++
 tests/test_utils.py                           |  80 ++++
 27 files changed, 3034 insertions(+), 96 deletions(-)
 create mode 100644 CONTRIBUTING.md
 create mode 100644 examples/basic_usage.py
 create mode 100644 examples/custom_training.py
 rename sentiment_analysis_lstm.py => examples/legacy_monolithic_script.py (100%)
 create mode 100644 examples/prediction_only.py
 create mode 100644 notebooks/sentiment_analysis_tutorial.ipynb
 create mode 100644 pytest.ini
 create mode 100644 requirements.txt
 create mode 100644 setup.py
 create mode 100644 src/sentiment_analysis/__init__.py
 create mode 100644 src/sentiment_analysis/__main__.py
 create mode 100644 src/sentiment_analysis/cli.py
 create mode 100644 src/sentiment_analysis/config.py
 create mode 100644 src/sentiment_analysis/data_loader.py
 create mode 100644 src/sentiment_analysis/model.py
 create mode 100644 src/sentiment_analysis/predict.py
 create mode 100644 src/sentiment_analysis/train.py
 create mode 100644 src/sentiment_analysis/utils.py
 create mode 100644 src/sentiment_analysis/visualization.py
 create mode 100644 tests/__init__.py
 create mode 100644 tests/conftest.py
 create mode 100644 tests/test_config.py
 create mode 100644 tests/test_data_loader.py
 create mode 100644 tests/test_model.py
 create mode 100644 tests/test_utils.py

diff --git a/.gitignore b/.gitignore
index 82f9275..3c32e4e 100644
--- a/.gitignore
+++ b/.gitignore
@@ -160,3 +160,38 @@ cython_debug/
 #  and can be added to the global gitignore or merged into this file.  For a more nuclear
 #  option (not recommended) you can uncomment the following to ignore the entire idea folder.
 #.idea/
+
+# Project-specific
+models/*.h5
+models/*.pkl
+models/*.json
+data/*.csv
+data/*.txt
+data/*.npz
+outputs/
+logs/
+*.log
+
+# Saved models and checkpoints
+*.h5
+*.hdf5
+*.ckpt
+*.pb
+
+# Training artifacts
+training_history.json
+tensorboard_logs/
+
+# macOS
+.DS_Store
+.AppleDouble
+.LSOverride
+
+# VS Code
+.vscode/
+
+# Temporary files
+*.tmp
+*.bak
+*.swp
+*~
diff --git a/CONTRIBUTING.md b/CONTRIBUTING.md
new file mode 100644
index 0000000..c60b348
--- /dev/null
+++ b/CONTRIBUTING.md
@@ -0,0 +1,331 @@
+# Contributing to Sentiment Analysis LSTM
+
+Thank you for your interest in contributing to this project! We welcome contributions from everyone.
+
+## Table of Contents
+
+- [Code of Conduct](#code-of-conduct)
+- [How Can I Contribute?](#how-can-i-contribute)
+- [Development Setup](#development-setup)
+- [Coding Standards](#coding-standards)
+- [Testing](#testing)
+- [Pull Request Process](#pull-request-process)
+- [Reporting Bugs](#reporting-bugs)
+- [Suggesting Enhancements](#suggesting-enhancements)
+
+## Code of Conduct
+
+By participating in this project, you are expected to:
+
+- Use welcoming and inclusive language
+- Be respectful of differing viewpoints and experiences
+- Gracefully accept constructive criticism
+- Focus on what is best for the community
+- Show empathy towards other community members
+
+## How Can I Contribute?
+
+### Types of Contributions
+
+1. **Bug Fixes**: Fix identified bugs in the codebase
+2. **New Features**: Implement new functionality
+3. **Documentation**: Improve or expand documentation
+4. **Tests**: Add or improve test coverage
+5. **Examples**: Create helpful usage examples
+6. **Performance**: Optimize existing code
+
+## Development Setup
+
+### 1. Fork and Clone
+
+```bash
+# Fork the repository on GitHub
+# Clone your fork
+git clone https://github.com/YOUR-USERNAME/Sentiment-Analysis-LSTM.git
+cd Sentiment-Analysis-LSTM
+```
+
+### 2. Install Development Dependencies
+
+```bash
+# Create a virtual environment
+python -m venv venv
+source venv/bin/activate  # On Windows: venv\Scripts\activate
+
+# Install in development mode with dev dependencies
+pip install -e ".[dev]"
+```
+
+### 3. Create a Branch
+
+```bash
+git checkout -b feature/your-feature-name
+# or
+git checkout -b fix/your-bug-fix
+```
+
+## Coding Standards
+
+### Python Style Guide
+
+We follow PEP 8 with some modifications:
+
+- **Line Length**: Maximum 100 characters
+- **Indentation**: 4 spaces (no tabs)
+- **Quotes**: Use double quotes for strings
+- **Imports**: Organized using `isort`
+
+### Code Formatting
+
+We use the following tools:
+
+```bash
+# Format code with black
+black src/ tests/
+
+# Sort imports with isort
+isort src/ tests/
+
+# Lint with flake8
+flake8 src/ tests/
+```
+
+### Docstrings
+
+Use Google-style docstrings:
+
+```python
+def function_name(param1, param2):
+    """
+    Brief description of function.
+
+    Args:
+        param1 (type): Description of param1
+        param2 (type): Description of param2
+
+    Returns:
+        type: Description of return value
+
+    Raises:
+        ValueError: Description of when this is raised
+    """
+    pass
+```
+
+### Type Hints
+
+Use type hints where appropriate:
+
+```python
+def predict_text(self, text: str) -> dict:
+    """Predict sentiment for a single text."""
+    pass
+```
+
+## Testing
+
+### Running Tests
+
+```bash
+# Run all tests
+pytest
+
+# Run with coverage
+pytest --cov=sentiment_analysis --cov-report=html
+
+# Run specific test file
+pytest tests/test_model.py
+
+# Run specific test
+pytest tests/test_model.py::TestSentimentLSTM::test_build_model
+```
+
+### Writing Tests
+
+- Place tests in the `tests/` directory
+- Name test files `test_*.py`
+- Name test classes `Test*`
+- Name test functions `test_*`
+
+Example test:
+
+```python
+import pytest
+from sentiment_analysis.model import SentimentLSTM
+
+class TestSentimentLSTM:
+    """Test cases for SentimentLSTM class."""
+
+    def test_build_model(self):
+        """Test building the model."""
+        model = SentimentLSTM()
+        keras_model = model.build_model()
+        assert keras_model is not None
+        assert len(keras_model.layers) > 0
+```
+
+### Test Coverage
+
+- Aim for at least 80% code coverage
+- Write tests for all new features
+- Write tests for bug fixes
+
+## Pull Request Process
+
+### Before Submitting
+
+1. **Update Documentation**: Update README.md and docstrings
+2. **Add Tests**: Ensure new code is tested
+3. **Run Tests**: All tests must pass
+4. **Format Code**: Run black and isort
+5. **Check Linting**: Run flake8
+6. **Update CHANGELOG**: Add entry for your changes
+
+### Submitting
+
+1. **Commit Your Changes**
+
+```bash
+git add .
+git commit -m "Add: brief description of changes"
+```
+
+Commit message format:
+- `Add: <description>` for new features
+- `Fix: <description>` for bug fixes
+- `Update: <description>` for updates
+- `Refactor: <description>` for refactoring
+- `Docs: <description>` for documentation
+
+2. **Push to Your Fork**
+
+```bash
+git push origin feature/your-feature-name
+```
+
+3. **Open a Pull Request**
+
+- Go to the original repository on GitHub
+- Click "New Pull Request"
+- Select your fork and branch
+- Fill out the PR template
+- Link any related issues
+
+### PR Template
+
+```markdown
+## Description
+Brief description of changes
+
+## Type of Change
+- [ ] Bug fix
+- [ ] New feature
+- [ ] Documentation update
+- [ ] Performance improvement
+
+## Testing
+- [ ] Tests pass locally
+- [ ] Added new tests
+- [ ] Updated documentation
+
+## Related Issues
+Fixes #(issue number)
+```
+
+### Review Process
+
+- PRs require at least one approval
+- Address reviewer feedback
+- Keep PRs focused and small
+- Be patient and respectful
+
+## Reporting Bugs
+
+### Before Reporting
+
+1. **Search Existing Issues**: Check if already reported
+2. **Update to Latest Version**: Verify bug exists in latest version
+3. **Gather Information**: Collect error messages and logs
+
+### Bug Report Template
+
+```markdown
+**Describe the Bug**
+Clear description of the bug
+
+**To Reproduce**
+Steps to reproduce:
+1. Go to '...'
+2. Run '...'
+3. See error
+
+**Expected Behavior**
+What you expected to happen
+
+**Screenshots/Logs**
+If applicable, add screenshots or error logs
+
+**Environment**
+- OS: [e.g., Ubuntu 20.04]
+- Python Version: [e.g., 3.9]
+- TensorFlow Version: [e.g., 2.10.0]
+
+**Additional Context**
+Any other relevant information
+```
+
+## Suggesting Enhancements
+
+### Enhancement Template
+
+```markdown
+**Is your feature request related to a problem?**
+Clear description of the problem
+
+**Describe the solution you'd like**
+Clear description of desired behavior
+
+**Describe alternatives you've considered**
+Alternative solutions or features
+
+**Additional context**
+Any other relevant information
+```
+
+## Project Structure
+
+Understanding the structure:
+
+```
+src/sentiment_analysis/
+├── config.py          # Configuration management
+├── data_loader.py     # Data loading and preprocessing
+├── model.py           # Model architecture
+├── train.py           # Training logic
+├── predict.py         # Prediction logic
+├── utils.py           # Utility functions
+├── visualization.py   # Visualization functions
+└── cli.py             # Command-line interface
+```
+
+## Communication
+
+- **Issues**: For bug reports and feature requests
+- **Pull Requests**: For code contributions
+- **Discussions**: For questions and ideas
+
+## Recognition
+
+Contributors will be recognized in:
+- The project README
+- Release notes
+- A dedicated CONTRIBUTORS file
+
+## Questions?
+
+If you have questions:
+1. Check the documentation
+2. Search existing issues
+3. Open a new issue with the "question" label
+
+Thank you for contributing to Sentiment Analysis LSTM!
diff --git a/README.md b/README.md
index 72a0908..e7e2552 100644
--- a/README.md
+++ b/README.md
@@ -1,147 +1,183 @@
-# Sentiment Analysis with LSTM - Movie Reviews
+# Sentiment Analysis with LSTM
 
-This project demonstrates how to build a deep learning model using an **LSTM (Long Short-Term Memory)** neural network for sentiment analysis of movie reviews. The model is trained on the IMDB dataset to classify movie reviews as positive or negative.
+<div align="center">
 
-## Table of Contents
+A professional, modular sentiment analysis framework using LSTM neural networks for movie review classification.
 
-1. [Introduction](#introduction)
-2. [Features](#features)
-3. [Installation](#installation)
-4. [Usage](#usage)
-5. [Examples](#examples)
-6. [Contributing](#contributing)
-7. [License](#license)
+[![Python 3.8+](https://img.shields.io/badge/python-3.8+-blue.svg)](https://www.python.org/downloads/)
+[![TensorFlow](https://img.shields.io/badge/TensorFlow-2.10+-orange.svg)](https://www.tensorflow.org/)
+[![License: MIT](https://img.shields.io/badge/License-MIT-yellow.svg)](https://opensource.org/licenses/MIT)
 
-## Introduction
+</div>
 
-Sentiment analysis is a common natural language processing (NLP) task that involves classifying text into positive or negative sentiments. This project uses a deep learning approach with a **Bidirectional LSTM** neural network to perform sentiment analysis on movie reviews from the IMDB dataset. LSTMs are well-suited for this task because they are capable of learning long-term dependencies in sequential data.
+## Overview
 
-## Features
+This project provides a complete, production-ready implementation of sentiment analysis using Long Short-Term Memory (LSTM) neural networks. Built on TensorFlow/Keras, it offers a modular architecture, comprehensive testing, multiple interfaces (CLI, Python API, Jupyter notebooks), and extensive documentation.
 
-- **LSTM-based Neural Network**: A deep learning model using LSTM layers to handle the sequential nature of text data.
-- **Bidirectional LSTM**: Utilizes a bidirectional LSTM to capture dependencies from both forward and backward sequences.
-- **Embedding Layer**: Converts words into dense vector representations to capture semantic relationships.
-- **Dropout Regularization**: Prevents overfitting by randomly dropping neurons during training.
-- **Text Preprocessing**: Automatic tokenization and padding to handle varying input lengths.
-- **Sentiment Prediction**: Predicts whether a given movie review is positive or negative.
+### Key Features
 
-## Installation
+- **Modular Architecture**: Clean separation of concerns with dedicated modules for data loading, model building, training, prediction, and visualization
+- **Bidirectional LSTM**: Captures dependencies from both forward and backward sequences for improved accuracy
+- **Multiple Interfaces**:
+  - Python API for programmatic access
+  - CLI tools for command-line usage
+  - Jupyter notebooks for interactive exploration
+- **Comprehensive Testing**: Unit tests with pytest for reliability
+- **Production Ready**: Model persistence, logging, configuration management
+- **Rich Visualizations**: Training curves, confusion matrices, ROC curves, prediction distributions
+- **Easy Installation**: Simple pip installation with all dependencies
 
-### Prerequisites
+## Table of Contents
 
-Ensure you have the following installed:
+- [Installation](#installation)
+- [Quick Start](#quick-start)
+- [Project Structure](#project-structure)
+- [Usage](#usage)
+- [Model Architecture](#model-architecture)
+- [Configuration](#configuration)
+- [Examples](#examples)
+- [Testing](#testing)
+- [Contributing](#contributing)
+- [License](#license)
 
-- Python 3.x
-- TensorFlow
-- Matplotlib
+## Installation
+
+### Prerequisites
 
-### Install Required Packages
+- Python 3.8 or higher
+- pip package manager
 
-If you haven't installed TensorFlow and Matplotlib yet, you can do so using pip:
+### Install from Source
 
 ```bash
-pip install tensorflow matplotlib
+# Clone the repository
+git clone https://github.com/pyenthusiasts/Sentiment-Analysis-LSTM.git
+cd Sentiment-Analysis-LSTM
+
+# Install the package
+pip install -e .
 ```
 
-## Usage
+### Install Dependencies Only
 
-1. **Clone the Repository**:
+```bash
+pip install -r requirements.txt
+```
 
-   Clone the repository to your local machine:
+## Quick Start
 
-   ```bash
-   git clone https://github.com/your-username/sentiment-analysis-lstm.git
-   ```
+### Python API
 
-2. **Navigate to the Directory**:
+```python
+from sentiment_analysis.train import Trainer
+from sentiment_analysis.predict import Predictor
+
+# Train a model
+trainer = Trainer()
+(X_train, y_train), (X_test, y_test) = trainer.prepare_data()
+history = trainer.train(X_train, y_train, X_test, y_test)
+
+# Make predictions
+predictor = Predictor()
+result = predictor.predict_text("Amazing movie! Loved it!")
+print(f"Sentiment: {result['sentiment']} (Score: {result['score']:.2f})")
+```
 
-   Go to the project directory:
+## Project Structure
 
-   ```bash
-   cd sentiment-analysis-lstm
-   ```
+```
+Sentiment-Analysis-LSTM/
+├── src/sentiment_analysis/      # Main package
+│   ├── config.py                # Configuration
+│   ├── data_loader.py           # Data loading
+│   ├── model.py                 # Model architecture
+│   ├── train.py                 # Training logic
+│   ├── predict.py               # Prediction logic
+│   ├── utils.py                 # Utilities
+│   └── visualization.py         # Visualizations
+├── tests/                       # Unit tests
+├── examples/                    # Example scripts
+├── notebooks/                   # Jupyter notebooks
+├── requirements.txt             # Dependencies
+└── setup.py                     # Package setup
+```
 
-3. **Run the Script**:
+## Usage
 
-   Run the script using Python:
+### Training a Model
 
-   ```bash
-   python sentiment_analysis_lstm.py
-   ```
+```python
+from sentiment_analysis.train import Trainer
 
-### Running the Program
+trainer = Trainer()
+(X_train, y_train), (X_test, y_test) = trainer.prepare_data()
+history = trainer.train(X_train, y_train, X_test, y_test, epochs=5)
+```
 
-When you run the script, it will:
+### Making Predictions
 
-- Load the IMDB dataset.
-- Preprocess the text data (tokenization and padding).
-- Define and compile an LSTM-based neural network model.
-- Train the model on the training set and validate it on a validation set.
-- Evaluate the model on the test set.
-- Plot the training and validation accuracy and loss over epochs.
-- Predict the sentiment of a new movie review sample.
+```python
+from sentiment_analysis.predict import Predictor
 
-## Examples
+predictor = Predictor()
+result = predictor.predict_text("This movie was amazing!")
+print(f"Sentiment: {result['sentiment']}")
+print(f"Confidence: {result['confidence']:.2%}")
+```
 
-### Output
+## Model Architecture
 
-The script will produce outputs similar to:
+1. **Embedding Layer**: 128-dimensional word embeddings
+2. **Bidirectional LSTM**: 64 units processing in both directions
+3. **Dropout**: 0.5 rate for regularization
+4. **LSTM**: 32 units  
+5. **Dense Output**: Sigmoid activation for binary classification
 
-1. **Test Accuracy**: The accuracy of the model on the test dataset, for example:
+## Configuration
 
-   ```
-   Test Accuracy: 0.86
-   ```
+Edit `src/sentiment_analysis/config.py` to customize:
 
-2. **Training and Validation Curves**: Plots of accuracy and loss over the training epochs.
+- `VOCAB_SIZE`: 10000 (vocabulary size)
+- `MAX_LENGTH`: 300 (sequence length)
+- `EMBEDDING_DIM`: 128
+- `BATCH_SIZE`: 128
+- `EPOCHS`: 5
 
-   ![Accuracy and Loss Plot](accuracy_loss_plot.png)
+## Examples
 
-3. **Predicted Sentiment**: Displays the predicted sentiment (positive or negative) for a new review.
+Run example scripts:
 
-   ```
-   Predicted Sentiment: Positive
-   ```
+```bash
+python examples/basic_usage.py
+python examples/custom_training.py
+python examples/prediction_only.py
+```
 
-### Predicting New Reviews
+## Testing
 
-To predict the sentiment of a new movie review, you can modify the `new_review` variable in the script:
+```bash
+# Run all tests
+pytest
 
-```python
-new_review = "This movie was fantastic! I really enjoyed the story and the acting was superb."
+# Run with coverage
+pytest --cov=sentiment_analysis
 ```
 
-Run the script again to see the predicted sentiment.
-
 ## Contributing
 
-Contributions are welcome! If you have ideas for new features, improvements, or bug fixes, please feel free to open an issue or create a pull request.
-
-### Steps to Contribute
-
-1. **Fork the Repository**: Click the 'Fork' button at the top right of this page.
-2. **Clone Your Fork**: Clone your forked repository to your local machine.
-   ```bash
-   git clone https://github.com/your-username/sentiment-analysis-lstm.git
-   ```
-3. **Create a Branch**: Create a new branch for your feature or bug fix.
-   ```bash
-   git checkout -b feature/your-feature-name
-   ```
-4. **Make Changes**: Make your changes and commit them with a descriptive message.
-   ```bash
-   git commit -m "Add: feature description"
-   ```
-5. **Push Changes**: Push your changes to your forked repository.
-   ```bash
-   git push origin feature/your-feature-name
-   ```
-6. **Create a Pull Request**: Go to the original repository on GitHub and create a pull request.
+Contributions welcome! See [CONTRIBUTING.md](CONTRIBUTING.md) for guidelines.
 
 ## License
 
-This project is licensed under the MIT License - see the [LICENSE](LICENSE) file for details.
+MIT License - see [LICENSE](LICENSE) for details.
+
+## Acknowledgments
+
+- Built with [TensorFlow](https://www.tensorflow.org/) and [Keras](https://keras.io/)
+- IMDB dataset from [Stanford AI Lab](http://ai.stanford.edu/~amaas/data/sentiment/)
 
 ---
 
-Thank you for using the Sentiment Analysis with LSTM! If you have any questions or feedback, feel free to reach out. Happy coding! 😊
+<div align="center">
+Made with passion for NLP and Deep Learning
+</div>
diff --git a/examples/basic_usage.py b/examples/basic_usage.py
new file mode 100644
index 0000000..0d5547b
--- /dev/null
+++ b/examples/basic_usage.py
@@ -0,0 +1,78 @@
+"""
+Basic usage example for the sentiment analysis package.
+
+This script demonstrates how to:
+1. Train a sentiment analysis model
+2. Make predictions on new text
+3. Visualize training results
+"""
+
+import sys
+from pathlib import Path
+
+# Add src to path for local development
+sys.path.insert(0, str(Path(__file__).parent.parent / 'src'))
+
+from sentiment_analysis.train import Trainer
+from sentiment_analysis.predict import Predictor
+from sentiment_analysis.visualization import Visualizer
+
+
+def main():
+    """Run basic usage example."""
+    print("=" * 70)
+    print(" Sentiment Analysis LSTM - Basic Usage Example ".center(70, "="))
+    print("=" * 70)
+
+    # Step 1: Train the model
+    print("\n[1/3] Training the model...")
+    print("-" * 70)
+
+    trainer = Trainer()
+    (X_train, y_train), (X_test, y_test) = trainer.prepare_data()
+
+    history = trainer.train(
+        X_train,
+        y_train,
+        X_test,
+        y_test,
+        epochs=2,  # Use fewer epochs for quick demo
+        verbose=1
+    )
+
+    # Step 2: Visualize training results
+    print("\n[2/3] Visualizing training results...")
+    print("-" * 70)
+
+    visualizer = Visualizer(output_dir='outputs')
+    visualizer.plot_training_history(history)
+
+    # Step 3: Make predictions
+    print("\n[3/3] Making predictions...")
+    print("-" * 70)
+
+    predictor = Predictor()
+
+    # Example texts to analyze
+    example_texts = [
+        "This movie was absolutely fantastic! Best film I've seen this year.",
+        "Terrible movie. Complete waste of time and money.",
+        "It was okay. Nothing special, but not terrible either.",
+        "Outstanding performance by the lead actor. Highly recommended!",
+    ]
+
+    print("\nPredictions:")
+    for i, text in enumerate(example_texts, 1):
+        result = predictor.predict_text(text)
+        print(f"\n{i}. Text: {text}")
+        print(f"   Sentiment: {result['sentiment']}")
+        print(f"   Score: {result['score']:.4f}")
+        print(f"   Confidence: {result['confidence']:.4f}")
+
+    print("\n" + "=" * 70)
+    print(" Example Complete! ".center(70, "="))
+    print("=" * 70)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/examples/custom_training.py b/examples/custom_training.py
new file mode 100644
index 0000000..c7ab064
--- /dev/null
+++ b/examples/custom_training.py
@@ -0,0 +1,71 @@
+"""
+Custom training example with advanced options.
+
+This script demonstrates:
+1. Custom hyperparameter configuration
+2. Different model architectures
+3. Advanced training options
+"""
+
+import sys
+from pathlib import Path
+
+sys.path.insert(0, str(Path(__file__).parent.parent / 'src'))
+
+from sentiment_analysis.train import Trainer
+from sentiment_analysis.config import ModelConfig
+from sentiment_analysis.visualization import Visualizer
+
+
+def main():
+    """Run custom training example."""
+    print("=" * 70)
+    print(" Custom Training Example ".center(70, "="))
+    print("=" * 70)
+
+    # Customize configuration
+    print("\n[1] Customizing model configuration...")
+    ModelConfig.EPOCHS = 3
+    ModelConfig.BATCH_SIZE = 64
+    ModelConfig.LEARNING_RATE = 0.0005
+    ModelConfig.DROPOUT_RATE = 0.3
+
+    print(f"Epochs: {ModelConfig.EPOCHS}")
+    print(f"Batch Size: {ModelConfig.BATCH_SIZE}")
+    print(f"Learning Rate: {ModelConfig.LEARNING_RATE}")
+    print(f"Dropout Rate: {ModelConfig.DROPOUT_RATE}")
+
+    # Initialize trainer
+    print("\n[2] Preparing data...")
+    trainer = Trainer()
+    (X_train, y_train), (X_test, y_test) = trainer.prepare_data()
+
+    # Train with custom options
+    print("\n[3] Training with custom options...")
+    history = trainer.train(
+        X_train,
+        y_train,
+        X_test,
+        y_test,
+        bidirectional=True,
+        spatial_dropout=True,
+        patience=2,
+        verbose=1
+    )
+
+    # Get best epoch
+    best_epoch, best_val_acc = trainer.get_best_epoch()
+    print(f"\nBest validation accuracy: {best_val_acc:.4f} at epoch {best_epoch}")
+
+    # Visualize
+    print("\n[4] Creating visualizations...")
+    visualizer = Visualizer(output_dir='outputs')
+    visualizer.plot_training_history(history)
+
+    print("\n" + "=" * 70)
+    print(" Training Complete! ".center(70, "="))
+    print("=" * 70)
+
+
+if __name__ == '__main__':
+    main()
diff --git a/sentiment_analysis_lstm.py b/examples/legacy_monolithic_script.py
similarity index 100%
rename from sentiment_analysis_lstm.py
rename to examples/legacy_monolithic_script.py
diff --git a/examples/prediction_only.py b/examples/prediction_only.py
new file mode 100644
index 0000000..ef46285
--- /dev/null
+++ b/examples/prediction_only.py
@@ -0,0 +1,73 @@
+"""
+Prediction-only example using a pre-trained model.
+
+This script demonstrates how to use a trained model for predictions
+without retraining.
+"""
+
+import sys
+from pathlib import Path
+
+sys.path.insert(0, str(Path(__file__).parent.parent / 'src'))
+
+from sentiment_analysis.predict import Predictor
+from sentiment_analysis.config import ModelConfig
+
+
+def main():
+    """Run prediction example."""
+    print("=" * 70)
+    print(" Sentiment Prediction Example ".center(70, "="))
+    print("=" * 70)
+
+    # Check if model exists
+    if not ModelConfig.MODEL_PATH.exists():
+        print("\nError: No trained model found!")
+        print(f"Expected model at: {ModelConfig.MODEL_PATH}")
+        print("\nPlease train a model first by running:")
+        print("  python examples/basic_usage.py")
+        print("  or")
+        print("  sentiment-train")
+        return
+
+    # Initialize predictor
+    print("\nLoading trained model...")
+    predictor = Predictor()
+
+    # Interactive prediction loop
+    print("\n" + "-" * 70)
+    print("Enter movie reviews to analyze (or 'quit' to exit)")
+    print("-" * 70)
+
+    while True:
+        print("\nEnter review text:")
+        text = input("> ")
+
+        if text.lower() in ['quit', 'exit', 'q']:
+            break
+
+        if not text.strip():
+            continue
+
+        # Make prediction
+        result = predictor.predict_text(text)
+
+        # Display result
+        print("\nPrediction:")
+        print(f"  Sentiment: {result['sentiment']}")
+        print(f"  Score: {result['score']:.4f}")
+        print(f"  Confidence: {result['confidence']:.2%}")
+
+        # Interpret confidence
+        if result['confidence'] > 0.8:
+            print("  (Very confident)")
+        elif result['confidence'] > 0.5:
+            print("  (Moderately confident)")
+        else:
+            print("  (Low confidence - neutral text)")
+
+    print("\nGoodbye!")
+
+
+if __name__ == '__main__':
+    main()
diff --git a/notebooks/sentiment_analysis_tutorial.ipynb b/notebooks/sentiment_analysis_tutorial.ipynb
new file mode 100644
index 0000000..d5dd0e4
--- /dev/null
+++ b/notebooks/sentiment_analysis_tutorial.ipynb
@@ -0,0 +1,360 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# Sentiment Analysis with LSTM - Complete Tutorial\n",
+    "\n",
+    "This notebook provides a comprehensive tutorial on using the Sentiment Analysis LSTM package.\n",
+    "\n",
+    "## Table of Contents\n",
+    "1. [Setup and Installation](#setup)\n",
+    "2. [Data Loading and Exploration](#data)\n",
+    "3. [Model Training](#training)\n",
+    "4. [Making Predictions](#predictions)\n",
+    "5. [Visualization](#visualization)\n",
+    "6. [Advanced Usage](#advanced)"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 1. Setup and Installation <a name=\"setup\"></a>\n",
+    "\n",
+    "First, let's import the necessary modules and set up our environment."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import sys\n",
+    "from pathlib import Path\n",
+    "\n",
+    "# Add src to path\n",
+    "sys.path.insert(0, str(Path.cwd().parent / 'src'))\n",
+    "\n",
+    "import numpy as np\n",
+    "import matplotlib.pyplot as plt\n",
+    "\n",
+    "from sentiment_analysis.data_loader import DataLoader\n",
+    "from sentiment_analysis.model import SentimentLSTM\n",
+    "from sentiment_analysis.train import Trainer\n",
+    "from sentiment_analysis.predict import Predictor\n",
+    "from sentiment_analysis.visualization import Visualizer\n",
+    "from sentiment_analysis.config import ModelConfig\n",
+    "\n",
+    "print(\"All imports successful!\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 2. Data Loading and Exploration <a name=\"data\"></a>\n",
+    "\n",
+    "Let's load the IMDB dataset and explore its structure."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Initialize data loader\n",
+    "data_loader = DataLoader(vocab_size=10000, max_length=300)\n",
+    "\n",
+    "# Load IMDB data\n",
+    "print(\"Loading IMDB dataset...\")\n",
+    "(X_train, y_train), (X_test, y_test) = data_loader.load_imdb_data()\n",
+    "\n",
+    "print(f\"\\nTraining samples: {len(X_train)}\")\n",
+    "print(f\"Test samples: {len(X_test)}\")\n",
+    "print(f\"Sequence length: {X_train.shape[1]}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Get data statistics\n",
+    "stats = data_loader.get_data_statistics(X_train, y_train, X_test, y_test)\n",
+    "\n",
+    "print(\"\\nDataset Statistics:\")\n",
+    "print(\"-\" * 50)\n",
+    "for key, value in stats.items():\n",
+    "    print(f\"{key:20s}: {value}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Decode and view a sample review\n",
+    "sample_idx = 0\n",
+    "decoded_review = data_loader.decode_review(X_train[sample_idx])\n",
+    "sentiment = \"Positive\" if y_train[sample_idx] == 1 else \"Negative\"\n",
+    "\n",
+    "print(f\"\\nSample Review (Index {sample_idx}):\")\n",
+    "print(f\"Sentiment: {sentiment}\")\n",
+    "print(f\"\\nText: {decoded_review[:200]}...\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 3. Model Training <a name=\"training\"></a>\n",
+    "\n",
+    "Now let's build and train our LSTM model."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Configure training parameters\n",
+    "ModelConfig.EPOCHS = 3  # Use fewer epochs for demo\n",
+    "ModelConfig.BATCH_SIZE = 128\n",
+    "ModelConfig.VALIDATION_SPLIT = 0.2\n",
+    "\n",
+    "print(\"Training Configuration:\")\n",
+    "print(f\"Epochs: {ModelConfig.EPOCHS}\")\n",
+    "print(f\"Batch Size: {ModelConfig.BATCH_SIZE}\")\n",
+    "print(f\"Validation Split: {ModelConfig.VALIDATION_SPLIT}\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Initialize and train\n",
+    "trainer = Trainer()\n",
+    "\n",
+    "print(\"\\nStarting training...\")\n",
+    "history = trainer.train(\n",
+    "    X_train,\n",
+    "    y_train,\n",
+    "    X_test,\n",
+    "    y_test,\n",
+    "    bidirectional=True,\n",
+    "    spatial_dropout=False,\n",
+    "    patience=2,\n",
+    "    verbose=1\n",
+    ")\n",
+    "\n",
+    "print(\"\\nTraining complete!\")"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Get best epoch\n",
+    "best_epoch, best_val_acc = trainer.get_best_epoch()\n",
+    "print(f\"Best Epoch: {best_epoch}\")\n",
+    "print(f\"Best Validation Accuracy: {best_val_acc:.4f}\")\n",
+    "print(f\"Test Accuracy: {history['test_accuracy']:.4f}\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 4. Making Predictions <a name=\"predictions\"></a>\n",
+    "\n",
+    "Let's use our trained model to make predictions on new text."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Initialize predictor\n",
+    "predictor = Predictor()\n",
+    "\n",
+    "# Example reviews\n",
+    "example_reviews = [\n",
+    "    \"This movie was absolutely fantastic! The acting was superb and the plot kept me engaged throughout.\",\n",
+    "    \"Terrible waste of time. The plot was predictable and the acting was mediocre at best.\",\n",
+    "    \"It was okay. Nothing special, but I didn't hate it.\",\n",
+    "    \"A masterpiece! One of the best films I've ever seen. Highly recommended!\",\n",
+    "    \"Boring and slow. I couldn't wait for it to end.\",\n",
+    "]\n",
+    "\n",
+    "print(\"\\nPredictions on Example Reviews:\")\n",
+    "print(\"=\" * 80)\n",
+    "\n",
+    "for i, review in enumerate(example_reviews, 1):\n",
+    "    result = predictor.predict_text(review)\n",
+    "    \n",
+    "    print(f\"\\n{i}. {review}\")\n",
+    "    print(f\"   → Sentiment: {result['sentiment']}\")\n",
+    "    print(f\"   → Score: {result['score']:.4f}\")\n",
+    "    print(f\"   → Confidence: {result['confidence']:.2%}\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 5. Visualization <a name=\"visualization\"></a>\n",
+    "\n",
+    "Let's visualize the training history and model performance."
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Create visualizer\n",
+    "visualizer = Visualizer(output_dir='../outputs')\n",
+    "\n",
+    "# Plot training history\n",
+    "visualizer.plot_training_history(history)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Evaluate and get predictions for visualization\n",
+    "y_pred_proba = trainer.model.model.predict(X_test, verbose=0)\n",
+    "y_pred = (y_pred_proba > 0.5).astype(int).flatten()\n",
+    "\n",
+    "# Plot prediction distribution\n",
+    "visualizer.plot_prediction_distribution(y_pred_proba.flatten(), y_test)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Plot confusion matrix\n",
+    "from sklearn.metrics import confusion_matrix\n",
+    "\n",
+    "cm = confusion_matrix(y_test, y_pred)\n",
+    "visualizer.plot_confusion_matrix(cm, labels=['Negative', 'Positive'])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Plot ROC curve\n",
+    "visualizer.plot_roc_curve(y_test, y_pred_proba.flatten())"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## 6. Advanced Usage <a name=\"advanced\"></a>\n",
+    "\n",
+    "### Custom Model Architecture"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Build a custom model\n",
+    "custom_model = SentimentLSTM()\n",
+    "model = custom_model.build_model(\n",
+    "    bidirectional=True,\n",
+    "    spatial_dropout=True\n",
+    ")\n",
+    "\n",
+    "# View model summary\n",
+    "print(custom_model.get_model_summary())"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "### Interactive Prediction"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Try your own review!\n",
+    "user_review = \"Your review text here\"\n",
+    "\n",
+    "result = predictor.predict_text(user_review)\n",
+    "\n",
+    "print(f\"\\nYour review: {user_review}\")\n",
+    "print(f\"Predicted sentiment: {result['sentiment']}\")\n",
+    "print(f\"Confidence: {result['confidence']:.2%}\")"
+   ]
+  },
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "## Conclusion\n",
+    "\n",
+    "This tutorial covered:\n",
+    "- Loading and exploring the IMDB dataset\n",
+    "- Training an LSTM model for sentiment analysis\n",
+    "- Making predictions on new text\n",
+    "- Visualizing model performance\n",
+    "- Advanced customization options\n",
+    "\n",
+    "For more information, check out the documentation and examples in the repository!"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.8.0"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 4
+}
diff --git a/pytest.ini b/pytest.ini
new file mode 100644
index 0000000..8e6eed2
--- /dev/null
+++ b/pytest.ini
@@ -0,0 +1,31 @@
+[pytest]
+# Pytest configuration
+testpaths = tests
+python_files = test_*.py
+python_classes = Test*
+python_functions = test_*
+
+# Show summary
+addopts =
+    -v
+    --tb=short
+    --strict-markers
+    --disable-warnings
+
+# Markers
+markers =
+    slow: marks tests as slow (deselect with '-m "not slow"')
+    integration: marks tests as integration tests
+    unit: marks tests as unit tests
+
+# Coverage
+[coverage:run]
+source = src/sentiment_analysis
+omit =
+    */tests/*
+    */setup.py
+
+[coverage:report]
+precision = 2
+show_missing = True
+skip_covered = False
diff --git a/requirements.txt b/requirements.txt
new file mode 100644
index 0000000..29e8e68
--- /dev/null
+++ b/requirements.txt
@@ -0,0 +1,24 @@
+# Core dependencies
+tensorflow>=2.10.0
+numpy>=1.21.0
+matplotlib>=3.5.0
+seaborn>=0.12.0
+
+# Data processing
+pandas>=1.4.0
+scikit-learn>=1.0.0
+
+# Utilities
+tqdm>=4.64.0
+
+# Development dependencies
+pytest>=7.0.0
+pytest-cov>=3.0.0
+black>=22.0.0
+flake8>=4.0.0
+isort>=5.10.0
+
+# Jupyter
+jupyter>=1.0.0
+ipython>=8.0.0
+notebook>=6.4.0
diff --git a/setup.py b/setup.py
new file mode 100644
index 0000000..2e72164
--- /dev/null
+++ b/setup.py
@@ -0,0 +1,80 @@
+"""Setup script for the sentiment analysis package."""
+
+from setuptools import setup, find_packages
+from pathlib import Path
+
+# Read the README file
+readme_file = Path(__file__).parent / "README.md"
+if readme_file.exists():
+    with open(readme_file, "r", encoding="utf-8") as f:
+        long_description = f.read()
+else:
+    long_description = "Sentiment Analysis with LSTM Neural Networks"
+
+# Read requirements
+requirements_file = Path(__file__).parent / "requirements.txt"
+if requirements_file.exists():
+    with open(requirements_file, "r", encoding="utf-8") as f:
+        requirements = [
+            line.strip()
+            for line in f
+            if line.strip() and not line.startswith("#")
+        ]
+else:
+    requirements = [
+        "tensorflow>=2.10.0",
+        "numpy>=1.21.0",
+        "matplotlib>=3.5.0",
+        "seaborn>=0.12.0",
+        "scikit-learn>=1.0.0",
+    ]
+
+setup(
+    name="sentiment-analysis-lstm",
+    version="1.0.0",
+    author="Your Name",
+    author_email="your.email@example.com",
+    description="Sentiment analysis using LSTM neural networks on IMDB movie reviews",
+    long_description=long_description,
+    long_description_content_type="text/markdown",
+    url="https://github.com/pyenthusiasts/Sentiment-Analysis-LSTM",
+    package_dir={"": "src"},
+    packages=find_packages(where="src"),
+    classifiers=[
+        "Development Status :: 4 - Beta",
+        "Intended Audience :: Developers",
+        "Intended Audience :: Science/Research",
+        "Topic :: Scientific/Engineering :: Artificial Intelligence",
+        "Topic :: Text Processing :: Linguistic",
+        "License :: OSI Approved :: MIT License",
+        "Programming Language :: Python :: 3",
+        "Programming Language :: Python :: 3.8",
+        "Programming Language :: Python :: 3.9",
+        "Programming Language :: Python :: 3.10",
+        "Programming Language :: Python :: 3.11",
+    ],
+    python_requires=">=3.8",
+    install_requires=requirements,
+    extras_require={
+        "dev": [
+            "pytest>=7.0.0",
+            "pytest-cov>=3.0.0",
+            "black>=22.0.0",
+            "flake8>=4.0.0",
+            "isort>=5.10.0",
+        ],
+        "jupyter": [
+            "jupyter>=1.0.0",
+            "ipython>=8.0.0",
+            "notebook>=6.4.0",
+        ],
+    },
+    entry_points={
+        "console_scripts": [
+            "sentiment-train=sentiment_analysis.cli:train_command",
+            "sentiment-predict=sentiment_analysis.cli:predict_command",
+        ],
+    },
+    include_package_data=True,
+    zip_safe=False,
+)
diff --git a/src/sentiment_analysis/__init__.py b/src/sentiment_analysis/__init__.py
new file mode 100644
index 0000000..09c8f42
--- /dev/null
+++ b/src/sentiment_analysis/__init__.py
@@ -0,0 +1,14 @@
+"""
+Sentiment Analysis with LSTM
+A modular package for sentiment analysis using LSTM neural networks.
+"""
+
+__version__ = "1.0.0"
+__author__ = "Your Name"
+
+from sentiment_analysis.model import SentimentLSTM
+from sentiment_analysis.data_loader import DataLoader
+from sentiment_analysis.train import Trainer
+from sentiment_analysis.predict import Predictor
+
+__all__ = ["SentimentLSTM", "DataLoader", "Trainer", "Predictor"]
diff --git a/src/sentiment_analysis/__main__.py b/src/sentiment_analysis/__main__.py
new file mode 100644
index 0000000..e6c68e5
--- /dev/null
+++ b/src/sentiment_analysis/__main__.py
@@ -0,0 +1,8 @@
+"""
+Entry point for running the sentiment analysis package as a module.
+"""
+
+from sentiment_analysis.cli import main
+
+if __name__ == '__main__':
+    main()
diff --git a/src/sentiment_analysis/cli.py b/src/sentiment_analysis/cli.py
new file mode 100644
index 0000000..19647eb
--- /dev/null
+++ b/src/sentiment_analysis/cli.py
@@ -0,0 +1,279 @@
+"""
+Command-line interface for sentiment analysis.
+"""
+
+import argparse
+import sys
+import json
+from pathlib import Path
+
+from sentiment_analysis.train import Trainer
+from sentiment_analysis.predict import Predictor
+from sentiment_analysis.config import ModelConfig
+from sentiment_analysis.visualization import Visualizer
+from sentiment_analysis.utils import setup_logger, print_section
+
+logger = setup_logger(__name__)
+
+
+def train_command():
+    """CLI command for training the model."""
+    parser = argparse.ArgumentParser(
+        description='Train a sentiment analysis LSTM model',
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+        epilog="""
+Examples:
+  # Train with default settings
+  sentiment-train
+
+  # Train with custom epochs and batch size
+  sentiment-train --epochs 10 --batch-size 64
+
+  # Train with spatial dropout
+  sentiment-train --spatial-dropout --patience 5
+        """
+    )
+
+    # Training parameters
+    parser.add_argument(
+        '--epochs',
+        type=int,
+        default=ModelConfig.EPOCHS,
+        help=f'Number of training epochs (default: {ModelConfig.EPOCHS})'
+    )
+    parser.add_argument(
+        '--batch-size',
+        type=int,
+        default=ModelConfig.BATCH_SIZE,
+        help=f'Batch size for training (default: {ModelConfig.BATCH_SIZE})'
+    )
+    parser.add_argument(
+        '--validation-split',
+        type=float,
+        default=ModelConfig.VALIDATION_SPLIT,
+        help=f'Validation split ratio (default: {ModelConfig.VALIDATION_SPLIT})'
+    )
+    parser.add_argument(
+        '--learning-rate',
+        type=float,
+        default=ModelConfig.LEARNING_RATE,
+        help=f'Learning rate (default: {ModelConfig.LEARNING_RATE})'
+    )
+
+    # Model architecture
+    parser.add_argument(
+        '--no-bidirectional',
+        action='store_true',
+        help='Use unidirectional LSTM instead of bidirectional'
+    )
+    parser.add_argument(
+        '--spatial-dropout',
+        action='store_true',
+        help='Use spatial dropout in the model'
+    )
+
+    # Early stopping
+    parser.add_argument(
+        '--patience',
+        type=int,
+        default=3,
+        help='Patience for early stopping (default: 3)'
+    )
+
+    # Output options
+    parser.add_argument(
+        '--verbose',
+        type=int,
+        choices=[0, 1, 2],
+        default=2,
+        help='Verbosity mode (0=silent, 1=progress, 2=detailed)'
+    )
+    parser.add_argument(
+        '--no-plots',
+        action='store_true',
+        help='Skip generating plots after training'
+    )
+
+    args = parser.parse_args()
+
+    print_section("Sentiment Analysis LSTM - Training")
+
+    # Update config with command-line arguments
+    if args.learning_rate != ModelConfig.LEARNING_RATE:
+        ModelConfig.LEARNING_RATE = args.learning_rate
+        logger.info(f"Learning rate set to {args.learning_rate}")
+
+    # Initialize trainer
+    trainer = Trainer()
+
+    # Prepare data
+    (X_train, y_train), (X_test, y_test) = trainer.prepare_data()
+
+    # Train model
+    history = trainer.train(
+        X_train,
+        y_train,
+        X_test,
+        y_test,
+        epochs=args.epochs,
+        batch_size=args.batch_size,
+        validation_split=args.validation_split,
+        bidirectional=not args.no_bidirectional,
+        spatial_dropout=args.spatial_dropout,
+        patience=args.patience,
+        verbose=args.verbose
+    )
+
+    # Get best epoch
+    best_epoch, best_val_acc = trainer.get_best_epoch()
+    if best_epoch:
+        logger.info(f"\nBest epoch: {best_epoch} (Val Accuracy: {best_val_acc:.4f})")
+
+    # Plot results
+    if not args.no_plots:
+        logger.info("Generating training plots...")
+        visualizer = Visualizer()
+        visualizer.plot_training_history(history)
+
+    print_section("Training Complete!")
+    logger.info(f"Model saved to: {ModelConfig.MODEL_PATH}")
+    logger.info(f"History saved to: {ModelConfig.HISTORY_PATH}")
+
+
+def predict_command():
+    """CLI command for making predictions."""
+    parser = argparse.ArgumentParser(
+        description='Predict sentiment using trained LSTM model',
+        formatter_class=argparse.RawDescriptionHelpFormatter,
+        epilog="""
+Examples:
+  # Predict sentiment for a single text
+  sentiment-predict --text "This movie was amazing!"
+
+  # Run predictions on example texts
+  sentiment-predict --examples
+
+  # Predict from a file (one text per line)
+  sentiment-predict --file reviews.txt
+
+  # Save predictions to JSON
+  sentiment-predict --examples --output predictions.json
+        """
+    )
+
+    # Input options
+    input_group = parser.add_mutually_exclusive_group(required=True)
+    input_group.add_argument(
+        '--text',
+        type=str,
+        help='Text to analyze'
+    )
+    input_group.add_argument(
+        '--file',
+        type=Path,
+        help='File containing texts (one per line)'
+    )
+    input_group.add_argument(
+        '--examples',
+        action='store_true',
+        help='Run predictions on example texts'
+    )
+
+    # Model options
+    parser.add_argument(
+        '--model',
+        type=Path,
+        help=f'Path to trained model (default: {ModelConfig.MODEL_PATH})'
+    )
+
+    # Output options
+    parser.add_argument(
+        '--output',
+        type=Path,
+        help='Save predictions to JSON file'
+    )
+    parser.add_argument(
+        '--verbose',
+        action='store_true',
+        help='Show detailed prediction information'
+    )
+
+    args = parser.parse_args()
+
+    print_section("Sentiment Analysis LSTM - Prediction")
+
+    # Initialize predictor
+    model_path = args.model or ModelConfig.MODEL_PATH
+    predictor = Predictor(model_path=model_path)
+
+    results = []
+
+    # Handle different input types
+    if args.text:
+        # Single text prediction
+        result = predictor.predict_text(args.text)
+        results = [result]
+
+        # Display result
+        logger.info(f"\nText: {result['text']}")
+        logger.info(f"Sentiment: {result['sentiment']}")
+        logger.info(f"Score: {result['score']:.4f}")
+        logger.info(f"Confidence: {result['confidence']:.4f}")
+
+    elif args.file:
+        # Batch prediction from file
+        if not args.file.exists():
+            logger.error(f"File not found: {args.file}")
+            sys.exit(1)
+
+        with open(args.file, 'r', encoding='utf-8') as f:
+            texts = [line.strip() for line in f if line.strip()]
+
+        logger.info(f"Loaded {len(texts)} texts from {args.file}")
+        results = predictor.predict_batch(texts)
+
+        # Display results
+        for i, result in enumerate(results, 1):
+            logger.info(f"\n[{i}] {result['text'][:60]}...")
+            logger.info(f"    Sentiment: {result['sentiment']} (Score: {result['score']:.4f})")
+
+    elif args.examples:
+        # Run example predictions
+        results = predictor.predict_examples()
+
+    # Save results if output file specified
+    if args.output:
+        with open(args.output, 'w', encoding='utf-8') as f:
+            json.dump(results, f, indent=2)
+        logger.info(f"\nPredictions saved to: {args.output}")
+
+    print_section("Prediction Complete!")
+
+
+def main():
+    """Main entry point for CLI."""
+    parser = argparse.ArgumentParser(
+        description='Sentiment Analysis with LSTM',
+        formatter_class=argparse.RawDescriptionHelpFormatter
+    )
+
+    subparsers = parser.add_subparsers(dest='command', help='Available commands')
+
+    # Train command
+    train_parser = subparsers.add_parser('train', help='Train the model')
+    train_parser.set_defaults(func=train_command)
+
+    # Predict command
+    predict_parser = subparsers.add_parser('predict', help='Make predictions')
+    predict_parser.set_defaults(func=predict_command)
+
+    args = parser.parse_args()
+
+    if hasattr(args, 'func'):
+        args.func()
+    else:
+        parser.print_help()
+
+
+if __name__ == '__main__':
+    main()
diff --git a/src/sentiment_analysis/config.py b/src/sentiment_analysis/config.py
new file mode 100644
index 0000000..8d070e3
--- /dev/null
+++ b/src/sentiment_analysis/config.py
@@ -0,0 +1,57 @@
+"""
+Configuration settings for the sentiment analysis model.
+"""
+
+import os
+from pathlib import Path
+
+# Project directories
+PROJECT_ROOT = Path(__file__).parent.parent.parent
+DATA_DIR = PROJECT_ROOT / "data"
+MODELS_DIR = PROJECT_ROOT / "models"
+LOGS_DIR = PROJECT_ROOT / "logs"
+
+# Create directories if they don't exist
+for directory in [DATA_DIR, MODELS_DIR, LOGS_DIR]:
+    directory.mkdir(parents=True, exist_ok=True)
+
+# Model hyperparameters
+class ModelConfig:
+    """Configuration class for model hyperparameters."""
+
+    # Data parameters
+    VOCAB_SIZE = 10000
+    MAX_LENGTH = 300
+
+    # Model architecture parameters
+    EMBEDDING_DIM = 128
+    LSTM_UNITS_1 = 64
+    LSTM_UNITS_2 = 32
+    DROPOUT_RATE = 0.5
+
+    # Training parameters
+    BATCH_SIZE = 128
+    EPOCHS = 5
+    VALIDATION_SPLIT = 0.2
+    LEARNING_RATE = 0.001
+
+    # Model file paths
+    MODEL_PATH = MODELS_DIR / "sentiment_lstm_model.h5"
+    TOKENIZER_PATH = MODELS_DIR / "tokenizer.pkl"
+    HISTORY_PATH = MODELS_DIR / "training_history.json"
+
+    @classmethod
+    def to_dict(cls):
+        """Convert configuration to dictionary."""
+        return {
+            key: getattr(cls, key)
+            for key in dir(cls)
+            if not key.startswith('_') and key.isupper()
+        }
+
+    @classmethod
+    def from_dict(cls, config_dict):
+        """Update configuration from dictionary."""
+        for key, value in config_dict.items():
+            if hasattr(cls, key):
+                setattr(cls, key, value)
diff --git a/src/sentiment_analysis/data_loader.py b/src/sentiment_analysis/data_loader.py
new file mode 100644
index 0000000..ad2ca89
--- /dev/null
+++ b/src/sentiment_analysis/data_loader.py
@@ -0,0 +1,157 @@
+"""
+Data loading and preprocessing utilities.
+"""
+
+import numpy as np
+from tensorflow.keras.datasets import imdb
+from tensorflow.keras.preprocessing.sequence import pad_sequences
+from tensorflow.keras.preprocessing.text import Tokenizer
+import pickle
+import logging
+
+from sentiment_analysis.config import ModelConfig
+
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+
+class DataLoader:
+    """Class for loading and preprocessing data for sentiment analysis."""
+
+    def __init__(self, vocab_size=None, max_length=None):
+        """
+        Initialize the DataLoader.
+
+        Args:
+            vocab_size (int): Maximum number of words to keep in vocabulary
+            max_length (int): Maximum length of sequences
+        """
+        self.vocab_size = vocab_size or ModelConfig.VOCAB_SIZE
+        self.max_length = max_length or ModelConfig.MAX_LENGTH
+        self.tokenizer = None
+        self.word_index = None
+
+    def load_imdb_data(self):
+        """
+        Load and preprocess the IMDB dataset.
+
+        Returns:
+            tuple: (X_train, y_train), (X_test, y_test)
+        """
+        logger.info(f"Loading IMDB dataset with vocab_size={self.vocab_size}")
+
+        # Load the IMDB dataset
+        (X_train, y_train), (X_test, y_test) = imdb.load_data(
+            num_words=self.vocab_size
+        )
+
+        logger.info(f"Loaded {len(X_train)} training samples and {len(X_test)} test samples")
+
+        # Pad sequences to ensure uniform input size
+        X_train = pad_sequences(X_train, maxlen=self.max_length)
+        X_test = pad_sequences(X_test, maxlen=self.max_length)
+
+        # Get word index for reference
+        self.word_index = imdb.get_word_index()
+
+        logger.info(f"Sequences padded to max_length={self.max_length}")
+
+        return (X_train, y_train), (X_test, y_test)
+
+    def preprocess_text(self, text, tokenizer=None):
+        """
+        Preprocess a text string for prediction.
+
+        Args:
+            text (str): Input text to preprocess
+            tokenizer (Tokenizer): Keras tokenizer (optional)
+
+        Returns:
+            np.ndarray: Preprocessed and padded sequence
+        """
+        if tokenizer is None:
+            # Create a new tokenizer if not provided
+            tokenizer = Tokenizer(num_words=self.vocab_size)
+            tokenizer.fit_on_texts([text])
+
+        # Convert text to sequence
+        sequence = tokenizer.texts_to_sequences([text])
+
+        # Pad sequence
+        padded = pad_sequences(sequence, maxlen=self.max_length)
+
+        return padded
+
+    def save_tokenizer(self, tokenizer, path):
+        """
+        Save tokenizer to file.
+
+        Args:
+            tokenizer: Keras tokenizer object
+            path (str): Path to save the tokenizer
+        """
+        with open(path, 'wb') as f:
+            pickle.dump(tokenizer, f)
+        logger.info(f"Tokenizer saved to {path}")
+
+    def load_tokenizer(self, path):
+        """
+        Load tokenizer from file.
+
+        Args:
+            path (str): Path to the tokenizer file
+
+        Returns:
+            Tokenizer: Loaded tokenizer object
+        """
+        with open(path, 'rb') as f:
+            tokenizer = pickle.load(f)
+        logger.info(f"Tokenizer loaded from {path}")
+        return tokenizer
+
+    def decode_review(self, encoded_review):
+        """
+        Decode an encoded review back to text.
+
+        Args:
+            encoded_review (list): List of word indices
+
+        Returns:
+            str: Decoded text
+        """
+        if self.word_index is None:
+            self.word_index = imdb.get_word_index()
+
+        # Reverse word index
+        reverse_word_index = {value: key for key, value in self.word_index.items()}
+
+        # Decode the review (indices are offset by 3)
+        decoded = ' '.join([
+            reverse_word_index.get(i - 3, '?') for i in encoded_review
+        ])
+
+        return decoded
+
+    def get_data_statistics(self, X_train, y_train, X_test, y_test):
+        """
+        Get statistics about the dataset.
+
+        Args:
+            X_train, y_train: Training data
+            X_test, y_test: Test data
+
+        Returns:
+            dict: Dictionary containing dataset statistics
+        """
+        stats = {
+            'train_samples': len(X_train),
+            'test_samples': len(X_test),
+            'train_positive': np.sum(y_train == 1),
+            'train_negative': np.sum(y_train == 0),
+            'test_positive': np.sum(y_test == 1),
+            'test_negative': np.sum(y_test == 0),
+            'sequence_length': X_train.shape[1] if len(X_train.shape) > 1 else 0,
+            'vocab_size': self.vocab_size
+        }
+
+        return stats
diff --git a/src/sentiment_analysis/model.py b/src/sentiment_analysis/model.py
new file mode 100644
index 0000000..0ebaf79
--- /dev/null
+++ b/src/sentiment_analysis/model.py
@@ -0,0 +1,190 @@
+"""
+LSTM model architecture for sentiment analysis.
+"""
+
+from tensorflow.keras.models import Sequential, load_model
+from tensorflow.keras.layers import (
+    Embedding, LSTM, Dense, Dropout, Bidirectional, SpatialDropout1D
+)
+from tensorflow.keras.optimizers import Adam
+from tensorflow.keras.callbacks import EarlyStopping, ModelCheckpoint, ReduceLROnPlateau
+import logging
+
+from sentiment_analysis.config import ModelConfig
+
+logging.basicConfig(level=logging.INFO)
+logger = logging.getLogger(__name__)
+
+
+class SentimentLSTM:
+    """LSTM-based model for sentiment analysis."""
+
+    def __init__(self, config=None):
+        """
+        Initialize the sentiment analysis model.
+
+        Args:
+            config (ModelConfig): Configuration object with hyperparameters
+        """
+        self.config = config or ModelConfig()
+        self.model = None
+
+    def build_model(self, bidirectional=True, spatial_dropout=False):
+        """
+        Build the LSTM model architecture.
+
+        Args:
+            bidirectional (bool): Whether to use bidirectional LSTM
+            spatial_dropout (bool): Whether to use spatial dropout
+
+        Returns:
+            Sequential: Compiled Keras model
+        """
+        logger.info("Building LSTM model...")
+
+        model = Sequential(name='sentiment_lstm')
+
+        # Embedding layer
+        model.add(Embedding(
+            input_dim=self.config.VOCAB_SIZE,
+            output_dim=self.config.EMBEDDING_DIM,
+            input_length=self.config.MAX_LENGTH,
+            name='embedding'
+        ))
+
+        # Optional spatial dropout
+        if spatial_dropout:
+            model.add(SpatialDropout1D(0.2, name='spatial_dropout'))
+
+        # First LSTM layer (bidirectional option)
+        if bidirectional:
+            model.add(Bidirectional(
+                LSTM(self.config.LSTM_UNITS_1, return_sequences=True),
+                name='bidirectional_lstm_1'
+            ))
+        else:
+            model.add(LSTM(
+                self.config.LSTM_UNITS_1,
+                return_sequences=True,
+                name='lstm_1'
+            ))
+
+        # Dropout for regularization
+        model.add(Dropout(self.config.DROPOUT_RATE, name='dropout_1'))
+
+        # Second LSTM layer
+        model.add(LSTM(self.config.LSTM_UNITS_2, name='lstm_2'))
+
+        # Output layer for binary classification
+        model.add(Dense(1, activation='sigmoid', name='output'))
+
+        # Compile the model
+        optimizer = Adam(learning_rate=self.config.LEARNING_RATE)
+        model.compile(
+            optimizer=optimizer,
+            loss='binary_crossentropy',
+            metrics=['accuracy']
+        )
+
+        self.model = model
+
+        logger.info("Model built successfully")
+        logger.info(f"Total parameters: {model.count_params():,}")
+
+        return model
+
+    def get_model_summary(self):
+        """
+        Get a summary of the model architecture.
+
+        Returns:
+            str: Model summary as string
+        """
+        if self.model is None:
+            return "Model not built yet"
+
+        summary_list = []
+        self.model.summary(print_fn=lambda x: summary_list.append(x))
+        return '\n'.join(summary_list)
+
+    def get_callbacks(self, patience=3):
+        """
+        Get training callbacks.
+
+        Args:
+            patience (int): Patience for early stopping
+
+        Returns:
+            list: List of Keras callbacks
+        """
+        callbacks = [
+            EarlyStopping(
+                monitor='val_loss',
+                patience=patience,
+                restore_best_weights=True,
+                verbose=1
+            ),
+            ModelCheckpoint(
+                filepath=str(self.config.MODEL_PATH),
+                monitor='val_accuracy',
+                save_best_only=True,
+                verbose=1
+            ),
+            ReduceLROnPlateau(
+                monitor='val_loss',
+                factor=0.5,
+                patience=2,
+                min_lr=1e-7,
+                verbose=1
+            )
+        ]
+
+        return callbacks
+
+    def save_model(self, path=None):
+        """
+        Save the trained model.
+
+        Args:
+            path (str): Path to save the model
+        """
+        if self.model is None:
+            raise ValueError("No model to save. Build and train the model first.")
+
+        save_path = path or self.config.MODEL_PATH
+        self.model.save(save_path)
+        logger.info(f"Model saved to {save_path}")
+
+    def load_model(self, path=None):
+        """
+        Load a trained model.
+
+        Args:
+            path (str): Path to the saved model
+
+        Returns:
+            Sequential: Loaded Keras model
+        """
+        load_path = path or self.config.MODEL_PATH
+        self.model = load_model(load_path)
+        logger.info(f"Model loaded from {load_path}")
+        return self.model
+
+    def predict_sentiment(self, preprocessed_text):
+        """
+        Predict sentiment for preprocessed text.
+
+        Args:
+            preprocessed_text (np.ndarray): Preprocessed and padded text
+
+        Returns:
+            tuple: (prediction score, sentiment label)
+        """
+        if self.model is None:
+            raise ValueError("Model not loaded. Load or build a model first.")
+
+        prediction = self.model.predict(preprocessed_text, verbose=0)
+        score = float(prediction[0][0])
+        sentiment = "Positive" if score > 0.5 else "Negative"
+
+        return score, sentiment
diff --git a/src/sentiment_analysis/predict.py b/src/sentiment_analysis/predict.py
new file mode 100644
index 0000000..e70e76d
--- /dev/null
+++ b/src/sentiment_analysis/predict.py
@@ -0,0 +1,190 @@
+"""
+Prediction utilities for the sentiment analysis model.
+"""
+
+import logging
+import numpy as np
+from pathlib import Path
+
+from sentiment_analysis.model import SentimentLSTM
+from sentiment_analysis.data_loader import DataLoader
+from sentiment_analysis.config import ModelConfig
+from sentiment_analysis.utils import setup_logger
+
+logger = setup_logger(__name__)
+
+
+class Predictor:
+    """Class for making predictions with the sentiment analysis model."""
+
+    def __init__(self, model_path=None, config=None):
+        """
+        Initialize the Predictor.
+
+        Args:
+            model_path (str): Path to the saved model
+            config (ModelConfig): Configuration object
+        """
+        self.config = config or ModelConfig()
+        self.model_path = model_path or self.config.MODEL_PATH
+
+        # Initialize model and data loader
+        self.sentiment_model = SentimentLSTM(self.config)
+        self.data_loader = DataLoader(
+            vocab_size=self.config.VOCAB_SIZE,
+            max_length=self.config.MAX_LENGTH
+        )
+
+        # Load the model if it exists
+        if Path(self.model_path).exists():
+            self.load_model()
+        else:
+            logger.warning(f"Model not found at {self.model_path}")
+
+    def load_model(self):
+        """Load the trained model."""
+        logger.info(f"Loading model from {self.model_path}")
+        self.sentiment_model.load_model(self.model_path)
+
+    def predict_text(self, text):
+        """
+        Predict sentiment for a single text.
+
+        Args:
+            text (str): Input text
+
+        Returns:
+            dict: Prediction results with score and sentiment
+        """
+        if self.sentiment_model.model is None:
+            raise ValueError("Model not loaded. Train or load a model first.")
+
+        # Preprocess the text
+        preprocessed = self.data_loader.preprocess_text(text)
+
+        # Make prediction
+        score, sentiment = self.sentiment_model.predict_sentiment(preprocessed)
+
+        result = {
+            'text': text,
+            'score': score,
+            'sentiment': sentiment,
+            'confidence': abs(score - 0.5) * 2  # Normalize confidence to 0-1
+        }
+
+        return result
+
+    def predict_batch(self, texts):
+        """
+        Predict sentiment for multiple texts.
+
+        Args:
+            texts (list): List of input texts
+
+        Returns:
+            list: List of prediction results
+        """
+        results = []
+
+        logger.info(f"Predicting sentiment for {len(texts)} texts...")
+
+        for text in texts:
+            result = self.predict_text(text)
+            results.append(result)
+
+        return results
+
+    def predict_with_explanation(self, text, top_k=10):
+        """
+        Predict sentiment with word importance explanation.
+
+        Args:
+            text (str): Input text
+            top_k (int): Number of top important words to return
+
+        Returns:
+            dict: Prediction results with word importance
+        """
+        # Get base prediction
+        result = self.predict_text(text)
+
+        # TODO: Implement gradient-based or attention-based word importance
+        # This is a placeholder for future enhancement
+        result['explanation'] = "Word importance analysis not yet implemented"
+
+        return result
+
+    def evaluate_model(self, X_test, y_test):
+        """
+        Evaluate the model on a test set.
+
+        Args:
+            X_test (np.ndarray): Test data
+            y_test (np.ndarray): Test labels
+
+        Returns:
+            dict: Evaluation metrics
+        """
+        if self.sentiment_model.model is None:
+            raise ValueError("Model not loaded. Train or load a model first.")
+
+        logger.info("Evaluating model...")
+
+        # Evaluate
+        test_loss, test_accuracy = self.sentiment_model.model.evaluate(
+            X_test, y_test, verbose=0
+        )
+
+        # Get predictions for detailed metrics
+        predictions = self.sentiment_model.model.predict(X_test, verbose=0)
+        predictions_binary = (predictions > 0.5).astype(int).flatten()
+
+        # Calculate additional metrics
+        from sklearn.metrics import classification_report, confusion_matrix
+
+        conf_matrix = confusion_matrix(y_test, predictions_binary)
+        class_report = classification_report(
+            y_test, predictions_binary,
+            target_names=['Negative', 'Positive'],
+            output_dict=True
+        )
+
+        results = {
+            'test_loss': float(test_loss),
+            'test_accuracy': float(test_accuracy),
+            'confusion_matrix': conf_matrix.tolist(),
+            'classification_report': class_report
+        }
+
+        logger.info(f"Test Accuracy: {test_accuracy:.4f}")
+        logger.info(f"Test Loss: {test_loss:.4f}")
+
+        return results
+
+    def predict_examples(self):
+        """
+        Run predictions on example texts.
+
+        Returns:
+            list: List of prediction results
+        """
+        example_texts = [
+            "This movie was fantastic! I really enjoyed the story and the acting was superb.",
+            "Terrible movie. Waste of time and money. Do not watch.",
+            "It was okay. Nothing special but not terrible either.",
+            "Absolutely brilliant! One of the best films I've ever seen.",
+            "Boring and predictable. The plot was full of holes.",
+            "Great performances by the cast. Highly recommended!",
+            "Disappointing. Had high expectations but it fell flat.",
+            "A masterpiece of cinema. Stunning visuals and storytelling.",
+        ]
+
+        logger.info("Running predictions on example texts...")
+        results = self.predict_batch(example_texts)
+
+        # Print results
+        for result in results:
+            logger.info(f"\nText: {result['text'][:60]}...")
+            logger.info(f"Sentiment: {result['sentiment']} (Score: {result['score']:.4f}, Confidence: {result['confidence']:.4f})")
+
+        return results
diff --git a/src/sentiment_analysis/train.py b/src/sentiment_analysis/train.py
new file mode 100644
index 0000000..8123880
--- /dev/null
+++ b/src/sentiment_analysis/train.py
@@ -0,0 +1,198 @@
+"""
+Training utilities for the sentiment analysis model.
+"""
+
+import json
+import logging
+from pathlib import Path
+import numpy as np
+
+from sentiment_analysis.model import SentimentLSTM
+from sentiment_analysis.data_loader import DataLoader
+from sentiment_analysis.config import ModelConfig
+from sentiment_analysis.utils import setup_logger
+
+logger = setup_logger(__name__)
+
+
+class Trainer:
+    """Class for training the sentiment analysis model."""
+
+    def __init__(self, config=None):
+        """
+        Initialize the Trainer.
+
+        Args:
+            config (ModelConfig): Configuration object
+        """
+        self.config = config or ModelConfig()
+        self.model = None
+        self.data_loader = DataLoader(
+            vocab_size=self.config.VOCAB_SIZE,
+            max_length=self.config.MAX_LENGTH
+        )
+        self.history = None
+
+    def prepare_data(self):
+        """
+        Prepare the dataset for training.
+
+        Returns:
+            tuple: Training and test data
+        """
+        logger.info("Preparing data...")
+        (X_train, y_train), (X_test, y_test) = self.data_loader.load_imdb_data()
+
+        # Log data statistics
+        stats = self.data_loader.get_data_statistics(X_train, y_train, X_test, y_test)
+        logger.info(f"Data statistics: {stats}")
+
+        return (X_train, y_train), (X_test, y_test)
+
+    def train(
+        self,
+        X_train,
+        y_train,
+        X_test=None,
+        y_test=None,
+        epochs=None,
+        batch_size=None,
+        validation_split=None,
+        bidirectional=True,
+        spatial_dropout=False,
+        patience=3,
+        verbose=2
+    ):
+        """
+        Train the sentiment analysis model.
+
+        Args:
+            X_train (np.ndarray): Training data
+            y_train (np.ndarray): Training labels
+            X_test (np.ndarray): Test data (optional)
+            y_test (np.ndarray): Test labels (optional)
+            epochs (int): Number of training epochs
+            batch_size (int): Batch size for training
+            validation_split (float): Fraction of data to use for validation
+            bidirectional (bool): Whether to use bidirectional LSTM
+            spatial_dropout (bool): Whether to use spatial dropout
+            patience (int): Patience for early stopping
+            verbose (int): Verbosity mode
+
+        Returns:
+            dict: Training history
+        """
+        # Use config defaults if not specified
+        epochs = epochs or self.config.EPOCHS
+        batch_size = batch_size or self.config.BATCH_SIZE
+        validation_split = validation_split or self.config.VALIDATION_SPLIT
+
+        logger.info("Starting training...")
+        logger.info(f"Epochs: {epochs}, Batch size: {batch_size}, Validation split: {validation_split}")
+
+        # Build the model
+        sentiment_model = SentimentLSTM(self.config)
+        sentiment_model.build_model(
+            bidirectional=bidirectional,
+            spatial_dropout=spatial_dropout
+        )
+        self.model = sentiment_model
+
+        # Get callbacks
+        callbacks = sentiment_model.get_callbacks(patience=patience)
+
+        # Train the model
+        history = sentiment_model.model.fit(
+            X_train,
+            y_train,
+            epochs=epochs,
+            batch_size=batch_size,
+            validation_split=validation_split,
+            callbacks=callbacks,
+            verbose=verbose
+        )
+
+        self.history = history.history
+
+        # Evaluate on test set if provided
+        if X_test is not None and y_test is not None:
+            logger.info("Evaluating on test set...")
+            test_loss, test_accuracy = sentiment_model.model.evaluate(
+                X_test, y_test, verbose=0
+            )
+            logger.info(f"Test Loss: {test_loss:.4f}")
+            logger.info(f"Test Accuracy: {test_accuracy:.4f}")
+
+            # Add test metrics to history
+            self.history['test_loss'] = test_loss
+            self.history['test_accuracy'] = test_accuracy
+
+        # Save the model
+        sentiment_model.save_model()
+
+        # Save training history
+        self.save_history()
+
+        logger.info("Training completed successfully")
+
+        return self.history
+
+    def save_history(self, path=None):
+        """
+        Save training history to JSON file.
+
+        Args:
+            path (str): Path to save the history
+        """
+        if self.history is None:
+            logger.warning("No training history to save")
+            return
+
+        save_path = path or self.config.HISTORY_PATH
+
+        # Convert numpy types to native Python types for JSON serialization
+        history_serializable = {}
+        for key, value in self.history.items():
+            if isinstance(value, (list, np.ndarray)):
+                history_serializable[key] = [float(v) for v in value]
+            else:
+                history_serializable[key] = float(value)
+
+        with open(save_path, 'w') as f:
+            json.dump(history_serializable, f, indent=2)
+
+        logger.info(f"Training history saved to {save_path}")
+
+    def load_history(self, path=None):
+        """
+        Load training history from JSON file.
+
+        Args:
+            path (str): Path to the history file
+
+        Returns:
+            dict: Training history
+        """
+        load_path = path or self.config.HISTORY_PATH
+
+        with open(load_path, 'r') as f:
+            self.history = json.load(f)
+
+        logger.info(f"Training history loaded from {load_path}")
+        return self.history
+
+    def get_best_epoch(self):
+        """
+        Get the epoch with the best validation accuracy.
+
+        Returns:
+            tuple: (best_epoch, best_val_accuracy)
+        """
+        if self.history is None or 'val_accuracy' not in self.history:
+            return None, None
+
+        val_accuracies = self.history['val_accuracy']
+        best_epoch = np.argmax(val_accuracies)
+        best_val_accuracy = val_accuracies[best_epoch]
+
+        return best_epoch + 1, best_val_accuracy
diff --git a/src/sentiment_analysis/utils.py b/src/sentiment_analysis/utils.py
new file mode 100644
index 0000000..5598a61
--- /dev/null
+++ b/src/sentiment_analysis/utils.py
@@ -0,0 +1,207 @@
+"""
+Utility functions for the sentiment analysis project.
+"""
+
+import logging
+import json
+import os
+from pathlib import Path
+import numpy as np
+from datetime import datetime
+
+
+def setup_logger(name, level=logging.INFO):
+    """
+    Set up a logger with the specified name and level.
+
+    Args:
+        name (str): Logger name
+        level: Logging level
+
+    Returns:
+        logging.Logger: Configured logger
+    """
+    logger = logging.getLogger(name)
+
+    if not logger.handlers:
+        # Create handler
+        handler = logging.StreamHandler()
+        handler.setLevel(level)
+
+        # Create formatter
+        formatter = logging.Formatter(
+            '%(asctime)s - %(name)s - %(levelname)s - %(message)s',
+            datefmt='%Y-%m-%d %H:%M:%S'
+        )
+        handler.setFormatter(formatter)
+
+        # Add handler to logger
+        logger.addHandler(handler)
+        logger.setLevel(level)
+
+    return logger
+
+
+def save_json(data, filepath):
+    """
+    Save data to a JSON file.
+
+    Args:
+        data (dict): Data to save
+        filepath (str): Path to save the file
+    """
+    with open(filepath, 'w') as f:
+        json.dump(data, f, indent=2)
+
+
+def load_json(filepath):
+    """
+    Load data from a JSON file.
+
+    Args:
+        filepath (str): Path to the JSON file
+
+    Returns:
+        dict: Loaded data
+    """
+    with open(filepath, 'r') as f:
+        return json.load(f)
+
+
+def ensure_dir(directory):
+    """
+    Ensure that a directory exists.
+
+    Args:
+        directory (str): Directory path
+    """
+    Path(directory).mkdir(parents=True, exist_ok=True)
+
+
+def get_timestamp():
+    """
+    Get current timestamp as string.
+
+    Returns:
+        str: Timestamp in format YYYYMMDD_HHMMSS
+    """
+    return datetime.now().strftime('%Y%m%d_%H%M%S')
+
+
+def calculate_metrics(y_true, y_pred):
+    """
+    Calculate classification metrics.
+
+    Args:
+        y_true (np.ndarray): True labels
+        y_pred (np.ndarray): Predicted labels
+
+    Returns:
+        dict: Dictionary of metrics
+    """
+    from sklearn.metrics import accuracy_score, precision_score, recall_score, f1_score
+
+    metrics = {
+        'accuracy': accuracy_score(y_true, y_pred),
+        'precision': precision_score(y_true, y_pred),
+        'recall': recall_score(y_true, y_pred),
+        'f1_score': f1_score(y_true, y_pred)
+    }
+
+    return metrics
+
+
+def format_time(seconds):
+    """
+    Format seconds into human-readable time string.
+
+    Args:
+        seconds (float): Time in seconds
+
+    Returns:
+        str: Formatted time string
+    """
+    if seconds < 60:
+        return f"{seconds:.1f}s"
+    elif seconds < 3600:
+        minutes = seconds / 60
+        return f"{minutes:.1f}m"
+    else:
+        hours = seconds / 3600
+        return f"{hours:.1f}h"
+
+
+def print_section(title, width=70):
+    """
+    Print a formatted section title.
+
+    Args:
+        title (str): Section title
+        width (int): Width of the section
+    """
+    print("\n" + "=" * width)
+    print(f" {title} ".center(width, "="))
+    print("=" * width + "\n")
+
+
+class EarlyStoppingMonitor:
+    """Monitor for implementing custom early stopping logic."""
+
+    def __init__(self, patience=5, min_delta=0.001):
+        """
+        Initialize the early stopping monitor.
+
+        Args:
+            patience (int): Number of epochs to wait before stopping
+            min_delta (float): Minimum change to qualify as an improvement
+        """
+        self.patience = patience
+        self.min_delta = min_delta
+        self.counter = 0
+        self.best_loss = None
+        self.should_stop = False
+
+    def __call__(self, val_loss):
+        """
+        Check if training should stop.
+
+        Args:
+            val_loss (float): Current validation loss
+
+        Returns:
+            bool: Whether to stop training
+        """
+        if self.best_loss is None:
+            self.best_loss = val_loss
+        elif val_loss > self.best_loss - self.min_delta:
+            self.counter += 1
+            if self.counter >= self.patience:
+                self.should_stop = True
+        else:
+            self.best_loss = val_loss
+            self.counter = 0
+
+        return self.should_stop
+
+
+def seed_everything(seed=42):
+    """
+    Set random seeds for reproducibility.
+
+    Args:
+        seed (int): Random seed
+    """
+    os.environ['PYTHONHASHSEED'] = str(seed)
+    np.random.seed(seed)
+
+    try:
+        import tensorflow as tf
+        tf.random.set_seed(seed)
+    except ImportError:
+        pass
+
+    try:
+        import random
+        random.seed(seed)
+    except ImportError:
+        pass
diff --git a/src/sentiment_analysis/visualization.py b/src/sentiment_analysis/visualization.py
new file mode 100644
index 0000000..f50da1d
--- /dev/null
+++ b/src/sentiment_analysis/visualization.py
@@ -0,0 +1,241 @@
+"""
+Visualization utilities for model training and evaluation.
+"""
+
+import matplotlib.pyplot as plt
+import seaborn as sns
+import numpy as np
+from pathlib import Path
+import logging
+
+from sentiment_analysis.utils import setup_logger
+
+logger = setup_logger(__name__)
+
+# Set style for better-looking plots
+sns.set_style("whitegrid")
+plt.rcParams['figure.figsize'] = (12, 8)
+
+
+class Visualizer:
+    """Class for creating visualizations of training and evaluation results."""
+
+    def __init__(self, output_dir='outputs'):
+        """
+        Initialize the Visualizer.
+
+        Args:
+            output_dir (str): Directory to save plots
+        """
+        self.output_dir = Path(output_dir)
+        self.output_dir.mkdir(parents=True, exist_ok=True)
+
+    def plot_training_history(self, history, save_path=None):
+        """
+        Plot training and validation accuracy and loss.
+
+        Args:
+            history (dict): Training history dictionary
+            save_path (str): Path to save the plot
+        """
+        fig, axes = plt.subplots(1, 2, figsize=(14, 5))
+
+        # Plot accuracy
+        if 'accuracy' in history:
+            axes[0].plot(history['accuracy'], label='Training Accuracy', linewidth=2)
+        if 'val_accuracy' in history:
+            axes[0].plot(history['val_accuracy'], label='Validation Accuracy', linewidth=2)
+
+        axes[0].set_title('Model Accuracy', fontsize=14, fontweight='bold')
+        axes[0].set_xlabel('Epoch', fontsize=12)
+        axes[0].set_ylabel('Accuracy', fontsize=12)
+        axes[0].legend(loc='lower right', fontsize=10)
+        axes[0].grid(True, alpha=0.3)
+
+        # Plot loss
+        if 'loss' in history:
+            axes[1].plot(history['loss'], label='Training Loss', linewidth=2)
+        if 'val_loss' in history:
+            axes[1].plot(history['val_loss'], label='Validation Loss', linewidth=2)
+
+        axes[1].set_title('Model Loss', fontsize=14, fontweight='bold')
+        axes[1].set_xlabel('Epoch', fontsize=12)
+        axes[1].set_ylabel('Loss', fontsize=12)
+        axes[1].legend(loc='upper right', fontsize=10)
+        axes[1].grid(True, alpha=0.3)
+
+        plt.tight_layout()
+
+        if save_path:
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Training history plot saved to {save_path}")
+        else:
+            save_path = self.output_dir / 'training_history.png'
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Training history plot saved to {save_path}")
+
+        plt.show()
+
+        return fig
+
+    def plot_confusion_matrix(self, confusion_matrix, labels=None, save_path=None):
+        """
+        Plot confusion matrix.
+
+        Args:
+            confusion_matrix (np.ndarray): Confusion matrix
+            labels (list): Class labels
+            save_path (str): Path to save the plot
+        """
+        if labels is None:
+            labels = ['Negative', 'Positive']
+
+        plt.figure(figsize=(8, 6))
+        sns.heatmap(
+            confusion_matrix,
+            annot=True,
+            fmt='d',
+            cmap='Blues',
+            xticklabels=labels,
+            yticklabels=labels,
+            cbar_kws={'label': 'Count'}
+        )
+
+        plt.title('Confusion Matrix', fontsize=14, fontweight='bold', pad=20)
+        plt.ylabel('True Label', fontsize=12)
+        plt.xlabel('Predicted Label', fontsize=12)
+        plt.tight_layout()
+
+        if save_path:
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Confusion matrix saved to {save_path}")
+        else:
+            save_path = self.output_dir / 'confusion_matrix.png'
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Confusion matrix saved to {save_path}")
+
+        plt.show()
+
+    def plot_prediction_distribution(self, predictions, labels=None, save_path=None):
+        """
+        Plot distribution of prediction scores.
+
+        Args:
+            predictions (np.ndarray): Prediction scores
+            labels (np.ndarray): True labels (optional)
+            save_path (str): Path to save the plot
+        """
+        fig, ax = plt.subplots(figsize=(10, 6))
+
+        if labels is not None:
+            # Plot separate distributions for positive and negative samples
+            pos_preds = predictions[labels == 1]
+            neg_preds = predictions[labels == 0]
+
+            ax.hist(neg_preds, bins=50, alpha=0.6, label='Negative Samples', color='red')
+            ax.hist(pos_preds, bins=50, alpha=0.6, label='Positive Samples', color='green')
+            ax.legend(fontsize=10)
+        else:
+            ax.hist(predictions, bins=50, alpha=0.7, color='blue')
+
+        ax.axvline(x=0.5, color='black', linestyle='--', linewidth=2, label='Decision Boundary')
+        ax.set_title('Prediction Score Distribution', fontsize=14, fontweight='bold')
+        ax.set_xlabel('Prediction Score', fontsize=12)
+        ax.set_ylabel('Frequency', fontsize=12)
+        ax.grid(True, alpha=0.3)
+
+        plt.tight_layout()
+
+        if save_path:
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Prediction distribution saved to {save_path}")
+        else:
+            save_path = self.output_dir / 'prediction_distribution.png'
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Prediction distribution saved to {save_path}")
+
+        plt.show()
+
+    def plot_roc_curve(self, y_true, y_pred_proba, save_path=None):
+        """
+        Plot ROC curve.
+
+        Args:
+            y_true (np.ndarray): True labels
+            y_pred_proba (np.ndarray): Predicted probabilities
+            save_path (str): Path to save the plot
+        """
+        from sklearn.metrics import roc_curve, auc
+
+        fpr, tpr, _ = roc_curve(y_true, y_pred_proba)
+        roc_auc = auc(fpr, tpr)
+
+        plt.figure(figsize=(8, 6))
+        plt.plot(
+            fpr, tpr,
+            color='darkorange',
+            lw=2,
+            label=f'ROC curve (AUC = {roc_auc:.3f})'
+        )
+        plt.plot([0, 1], [0, 1], color='navy', lw=2, linestyle='--', label='Random Classifier')
+
+        plt.xlim([0.0, 1.0])
+        plt.ylim([0.0, 1.05])
+        plt.xlabel('False Positive Rate', fontsize=12)
+        plt.ylabel('True Positive Rate', fontsize=12)
+        plt.title('Receiver Operating Characteristic (ROC) Curve', fontsize=14, fontweight='bold')
+        plt.legend(loc='lower right', fontsize=10)
+        plt.grid(True, alpha=0.3)
+        plt.tight_layout()
+
+        if save_path:
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"ROC curve saved to {save_path}")
+        else:
+            save_path = self.output_dir / 'roc_curve.png'
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"ROC curve saved to {save_path}")
+
+        plt.show()
+
+    def plot_metrics_comparison(self, metrics_dict, save_path=None):
+        """
+        Plot comparison of multiple metrics.
+
+        Args:
+            metrics_dict (dict): Dictionary of metrics
+            save_path (str): Path to save the plot
+        """
+        metrics_names = list(metrics_dict.keys())
+        metrics_values = list(metrics_dict.values())
+
+        plt.figure(figsize=(10, 6))
+        bars = plt.bar(metrics_names, metrics_values, color='steelblue', alpha=0.7)
+
+        # Add value labels on bars
+        for bar in bars:
+            height = bar.get_height()
+            plt.text(
+                bar.get_x() + bar.get_width() / 2.,
+                height,
+                f'{height:.4f}',
+                ha='center',
+                va='bottom',
+                fontsize=10
+            )
+
+        plt.title('Model Performance Metrics', fontsize=14, fontweight='bold')
+        plt.ylabel('Score', fontsize=12)
+        plt.ylim([0, 1])
+        plt.grid(True, alpha=0.3, axis='y')
+        plt.tight_layout()
+
+        if save_path:
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Metrics comparison saved to {save_path}")
+        else:
+            save_path = self.output_dir / 'metrics_comparison.png'
+            plt.savefig(save_path, dpi=300, bbox_inches='tight')
+            logger.info(f"Metrics comparison saved to {save_path}")
+
+        plt.show()
diff --git a/tests/__init__.py b/tests/__init__.py
new file mode 100644
index 0000000..32df82b
--- /dev/null
+++ b/tests/__init__.py
@@ -0,0 +1 @@
+"""Unit tests for the sentiment analysis package."""
diff --git a/tests/conftest.py b/tests/conftest.py
new file mode 100644
index 0000000..7eab4a0
--- /dev/null
+++ b/tests/conftest.py
@@ -0,0 +1,26 @@
+"""Pytest configuration and fixtures."""
+
+import pytest
+import numpy as np
+
+
+@pytest.fixture
+def sample_texts():
+    """Sample texts for testing."""
+    return [
+        "This movie was fantastic!",
+        "Terrible waste of time.",
+        "It was okay, nothing special.",
+    ]
+
+
+@pytest.fixture
+def sample_labels():
+    """Sample labels for testing."""
+    return np.array([1, 0, 0])
+
+
+@pytest.fixture
+def sample_sequences():
+    """Sample sequences for testing."""
+    return np.random.randint(0, 1000, (10, 100))
diff --git a/tests/test_config.py b/tests/test_config.py
new file mode 100644
index 0000000..d0da326
--- /dev/null
+++ b/tests/test_config.py
@@ -0,0 +1,44 @@
+"""Tests for configuration module."""
+
+import pytest
+from sentiment_analysis.config import ModelConfig, DATA_DIR, MODELS_DIR
+
+
+class TestModelConfig:
+    """Test cases for ModelConfig class."""
+
+    def test_config_attributes(self):
+        """Test that config has required attributes."""
+        assert hasattr(ModelConfig, 'VOCAB_SIZE')
+        assert hasattr(ModelConfig, 'MAX_LENGTH')
+        assert hasattr(ModelConfig, 'EMBEDDING_DIM')
+        assert hasattr(ModelConfig, 'BATCH_SIZE')
+        assert hasattr(ModelConfig, 'EPOCHS')
+
+    def test_config_values(self):
+        """Test that config values are correct types."""
+        assert isinstance(ModelConfig.VOCAB_SIZE, int)
+        assert isinstance(ModelConfig.MAX_LENGTH, int)
+        assert isinstance(ModelConfig.BATCH_SIZE, int)
+        assert isinstance(ModelConfig.EPOCHS, int)
+        assert isinstance(ModelConfig.DROPOUT_RATE, float)
+
+    def test_config_to_dict(self):
+        """Test converting config to dictionary."""
+        config_dict = ModelConfig.to_dict()
+        assert isinstance(config_dict, dict)
+        assert 'VOCAB_SIZE' in config_dict
+        assert 'MAX_LENGTH' in config_dict
+
+    def test_config_from_dict(self):
+        """Test updating config from dictionary."""
+        original_vocab = ModelConfig.VOCAB_SIZE
+        ModelConfig.from_dict({'VOCAB_SIZE': 5000})
+        assert ModelConfig.VOCAB_SIZE == 5000
+        # Reset
+        ModelConfig.VOCAB_SIZE = original_vocab
+
+    def test_directories_exist(self):
+        """Test that required directories are created."""
+        assert DATA_DIR.exists()
+        assert MODELS_DIR.exists()
diff --git a/tests/test_data_loader.py b/tests/test_data_loader.py
new file mode 100644
index 0000000..bcc2361
--- /dev/null
+++ b/tests/test_data_loader.py
@@ -0,0 +1,54 @@
+"""Tests for data loader module."""
+
+import pytest
+import numpy as np
+from sentiment_analysis.data_loader import DataLoader
+
+
+class TestDataLoader:
+    """Test cases for DataLoader class."""
+
+    @pytest.fixture
+    def data_loader(self):
+        """Create a DataLoader instance."""
+        return DataLoader(vocab_size=1000, max_length=100)
+
+    def test_initialization(self, data_loader):
+        """Test DataLoader initialization."""
+        assert data_loader.vocab_size == 1000
+        assert data_loader.max_length == 100
+        assert data_loader.tokenizer is None
+
+    def test_load_imdb_data(self, data_loader):
+        """Test loading IMDB dataset."""
+        (X_train, y_train), (X_test, y_test) = data_loader.load_imdb_data()
+
+        # Check shapes
+        assert len(X_train) > 0
+        assert len(X_test) > 0
+        assert X_train.shape[1] == 100  # max_length
+        assert X_test.shape[1] == 100
+
+        # Check labels
+        assert set(np.unique(y_train)) <= {0, 1}
+        assert set(np.unique(y_test)) <= {0, 1}
+
+    def test_preprocess_text(self, data_loader):
+        """Test text preprocessing."""
+        text = "This is a test review."
+        preprocessed = data_loader.preprocess_text(text)
+
+        assert isinstance(preprocessed, np.ndarray)
+        assert preprocessed.shape[0] == 1
+        assert preprocessed.shape[1] == data_loader.max_length
+
+    def test_get_data_statistics(self, data_loader):
+        """Test getting data statistics."""
+        (X_train, y_train), (X_test, y_test) = data_loader.load_imdb_data()
+        stats = data_loader.get_data_statistics(X_train, y_train, X_test, y_test)
+
+        assert 'train_samples' in stats
+        assert 'test_samples' in stats
+        assert 'vocab_size' in stats
+        assert stats['train_samples'] == len(X_train)
+        assert stats['test_samples'] == len(X_test)
diff --git a/tests/test_model.py b/tests/test_model.py
new file mode 100644
index 0000000..f4364b8
--- /dev/null
+++ b/tests/test_model.py
@@ -0,0 +1,73 @@
+"""Tests for model module."""
+
+import pytest
+import numpy as np
+from sentiment_analysis.model import SentimentLSTM
+from sentiment_analysis.config import ModelConfig
+
+
+class TestSentimentLSTM:
+    """Test cases for SentimentLSTM class."""
+
+    @pytest.fixture
+    def model(self):
+        """Create a SentimentLSTM instance."""
+        return SentimentLSTM()
+
+    def test_initialization(self, model):
+        """Test model initialization."""
+        assert model.config is not None
+        assert model.model is None
+
+    def test_build_model_bidirectional(self, model):
+        """Test building bidirectional LSTM model."""
+        keras_model = model.build_model(bidirectional=True)
+
+        assert keras_model is not None
+        assert len(keras_model.layers) > 0
+        assert keras_model.layers[-1].output_shape == (None, 1)
+
+    def test_build_model_unidirectional(self, model):
+        """Test building unidirectional LSTM model."""
+        keras_model = model.build_model(bidirectional=False)
+
+        assert keras_model is not None
+        assert len(keras_model.layers) > 0
+
+    def test_build_model_with_spatial_dropout(self, model):
+        """Test building model with spatial dropout."""
+        keras_model = model.build_model(spatial_dropout=True)
+
+        assert keras_model is not None
+        # Check that SpatialDropout is in the model
+        layer_names = [layer.__class__.__name__ for layer in keras_model.layers]
+        assert 'SpatialDropout1D' in layer_names
+
+    def test_get_model_summary(self, model):
+        """Test getting model summary."""
+        model.build_model()
+        summary = model.get_model_summary()
+
+        assert isinstance(summary, str)
+        assert len(summary) > 0
+        assert 'lstm' in summary.lower()
+
+    def test_get_callbacks(self, model):
+        """Test getting training callbacks."""
+        callbacks = model.get_callbacks(patience=3)
+
+        assert isinstance(callbacks, list)
+        assert len(callbacks) > 0
+
+    def test_predict_sentiment(self, model):
+        """Test sentiment prediction."""
+        model.build_model()
+
+        # Create dummy input
+        dummy_input = np.random.randint(0, 1000, (1, ModelConfig.MAX_LENGTH))
+
+        score, sentiment = model.predict_sentiment(dummy_input)
+
+        assert isinstance(score, float)
+        assert 0 <= score <= 1
+        assert sentiment in ['Positive', 'Negative']
diff --git a/tests/test_utils.py b/tests/test_utils.py
new file mode 100644
index 0000000..c87352c
--- /dev/null
+++ b/tests/test_utils.py
@@ -0,0 +1,80 @@
+"""Tests for utils module."""
+
+import pytest
+import numpy as np
+from pathlib import Path
+import tempfile
+import json
+
+from sentiment_analysis.utils import (
+    setup_logger,
+    save_json,
+    load_json,
+    ensure_dir,
+    get_timestamp,
+    calculate_metrics,
+    format_time
+)
+
+
+class TestUtils:
+    """Test cases for utility functions."""
+
+    def test_setup_logger(self):
+        """Test logger setup."""
+        logger = setup_logger('test_logger')
+        assert logger is not None
+        assert logger.name == 'test_logger'
+
+    def test_save_and_load_json(self):
+        """Test JSON save and load."""
+        with tempfile.NamedTemporaryFile(mode='w', suffix='.json', delete=False) as f:
+            temp_path = f.name
+
+        try:
+            # Save
+            test_data = {'key': 'value', 'number': 42}
+            save_json(test_data, temp_path)
+
+            # Load
+            loaded_data = load_json(temp_path)
+            assert loaded_data == test_data
+
+        finally:
+            Path(temp_path).unlink(missing_ok=True)
+
+    def test_ensure_dir(self):
+        """Test directory creation."""
+        with tempfile.TemporaryDirectory() as tmpdir:
+            test_dir = Path(tmpdir) / 'test_subdir' / 'nested'
+            ensure_dir(test_dir)
+            assert test_dir.exists()
+            assert test_dir.is_dir()
+
+    def test_get_timestamp(self):
+        """Test timestamp generation."""
+        timestamp = get_timestamp()
+        assert isinstance(timestamp, str)
+        assert len(timestamp) == 15  # YYYYMMDD_HHMMSS
+
+    def test_calculate_metrics(self):
+        """Test metrics calculation."""
+        y_true = np.array([0, 1, 1, 0, 1])
+        y_pred = np.array([0, 1, 0, 0, 1])
+
+        metrics = calculate_metrics(y_true, y_pred)
+
+        assert 'accuracy' in metrics
+        assert 'precision' in metrics
+        assert 'recall' in metrics
+        assert 'f1_score' in metrics
+
+        # Check value ranges
+        for metric_value in metrics.values():
+            assert 0 <= metric_value <= 1
+
+    def test_format_time(self):
+        """Test time formatting."""
+        assert format_time(30) == '30.0s'
+        assert format_time(90) == '1.5m'
+        assert format_time(3600) == '1.0h'

From 9c60e0a0b2436cdb7315be3b6b27ce2ee1c76eee Mon Sep 17 00:00:00 2001
From: Claude <noreply@anthropic.com>
Date: Thu, 13 Nov 2025 18:05:18 +0000
Subject: [PATCH 2/2] Add production-ready infrastructure and features

This commit adds comprehensive production-ready features to transform
the project into an enterprise-grade application.

Docker & Containerization:
- Dockerfile with multi-stage build for optimized images
- docker-compose.yml for orchestrating multiple services
- .dockerignore for efficient builds
- Docker documentation (docs/DOCKER.md)

CI/CD & Automation:
- GitHub Actions workflows for CI/CD pipeline
  * ci.yml - Comprehensive testing, linting, security scans
  * release.yml - Automated package publishing
- Pre-commit hooks for code quality (.pre-commit-config.yaml)
- Makefile with 40+ commands for common development tasks
- Shell scripts for training and API deployment

API & Web Services:
- FastAPI-based REST API (src/sentiment_analysis/api.py)
  * Single and batch prediction endpoints
  * Health check and model info endpoints
  * Comprehensive request/response validation
  * Error handling and logging
  * Swagger/ReDoc documentation
- API documentation (docs/API.md)
- requirements-api.txt for API dependencies

Code Quality & Configuration:
- pyproject.toml for modern Python packaging
- .flake8 configuration for linting
- .editorconfig for consistent coding styles
- Type checking with mypy configured
- Black and isort configurations

Error Handling & Validation:
- Custom exception classes (src/sentiment_analysis/exceptions.py)
  * SentimentAnalysisError (base)
  * ModelNotFoundError
  * DataLoadError
  * InvalidInputError
  * TrainingError
  * PredictionError
  * and more...
- Environment variable support (.env.example)

Security & Best Practices:
- SECURITY.md with security policy and best practices
- GitHub issue templates (bug reports, feature requests)
- Pull request template
- Security scanning in CI/CD
- Dependency vulnerability checking

Documentation:
- CHANGELOG.md for tracking changes
- Comprehensive Docker guide
- API documentation with examples
- Security guidelines

Scripts & Utilities:
- scripts/train_model.sh - Automated training with logging
- scripts/start_api.sh - API server startup script

This infrastructure enables:
- Containerized deployment
- Automated testing and quality checks
- RESTful API for production use
- Professional development workflow
- Security-first approach
- Comprehensive monitoring and logging
---
 .dockerignore                             |  56 ++++
 .editorconfig                             |  36 ++
 .env.example                              |  51 +++
 .flake8                                   |  18 +
 .github/ISSUE_TEMPLATE/bug_report.md      |  39 +++
 .github/ISSUE_TEMPLATE/feature_request.md |  22 ++
 .github/pull_request_template.md          |  34 ++
 .github/workflows/ci.yml                  | 157 +++++++++
 .github/workflows/release.yml             |  43 +++
 .pre-commit-config.yaml                   |  83 +++++
 CHANGELOG.md                              |  76 +++++
 Dockerfile                                |  66 ++++
 Makefile                                  | 159 +++++++++
 SECURITY.md                               | 128 +++++++
 docker-compose.yml                        |  81 +++++
 docs/API.md                               | 392 ++++++++++++++++++++++
 docs/DOCKER.md                            | 378 +++++++++++++++++++++
 pyproject.toml                            | 112 +++++++
 requirements-api.txt                      |   5 +
 scripts/start_api.sh                      |  39 +++
 scripts/train_model.sh                    |  43 +++
 src/sentiment_analysis/api.py             | 317 +++++++++++++++++
 src/sentiment_analysis/exceptions.py      |  66 ++++
 23 files changed, 2401 insertions(+)
 create mode 100644 .dockerignore
 create mode 100644 .editorconfig
 create mode 100644 .env.example
 create mode 100644 .flake8
 create mode 100644 .github/ISSUE_TEMPLATE/bug_report.md
 create mode 100644 .github/ISSUE_TEMPLATE/feature_request.md
 create mode 100644 .github/pull_request_template.md
 create mode 100644 .github/workflows/ci.yml
 create mode 100644 .github/workflows/release.yml
 create mode 100644 .pre-commit-config.yaml
 create mode 100644 CHANGELOG.md
 create mode 100644 Dockerfile
 create mode 100644 Makefile
 create mode 100644 SECURITY.md
 create mode 100644 docker-compose.yml
 create mode 100644 docs/API.md
 create mode 100644 docs/DOCKER.md
 create mode 100644 pyproject.toml
 create mode 100644 requirements-api.txt
 create mode 100755 scripts/start_api.sh
 create mode 100755 scripts/train_model.sh
 create mode 100644 src/sentiment_analysis/api.py
 create mode 100644 src/sentiment_analysis/exceptions.py

diff --git a/.dockerignore b/.dockerignore
new file mode 100644
index 0000000..8d25bf0
--- /dev/null
+++ b/.dockerignore
@@ -0,0 +1,56 @@
+# Git
+.git
+.gitignore
+.gitattributes
+
+# Python
+__pycache__/
+*.py[cod]
+*$py.class
+*.so
+.Python
+*.egg-info/
+dist/
+build/
+*.egg
+
+# Virtual environments
+venv/
+env/
+ENV/
+.venv
+
+# IDE
+.vscode/
+.idea/
+*.swp
+*.swo
+*~
+
+# Project specific
+models/*.h5
+models/*.pkl
+data/*
+outputs/
+logs/
+*.log
+
+# Documentation
+docs/_build/
+
+# Tests
+.pytest_cache/
+.coverage
+htmlcov/
+.tox/
+
+# OS
+.DS_Store
+Thumbs.db
+
+# Jupyter
+.ipynb_checkpoints/
+
+# Temporary
+*.tmp
+*.bak
diff --git a/.editorconfig b/.editorconfig
new file mode 100644
index 0000000..405f1a5
--- /dev/null
+++ b/.editorconfig
@@ -0,0 +1,36 @@
+# EditorConfig is awesome: https://EditorConfig.org
+
+# top-most EditorConfig file
+root = true
+
+# Unix-style newlines with a newline ending every file
+[*]
+end_of_line = lf
+insert_final_newline = true
+charset = utf-8
+trim_trailing_whitespace = true
+
+# Python files
+[*.py]
+indent_style = space
+indent_size = 4
+max_line_length = 100
+
+# YAML files
+[*.{yml,yaml}]
+indent_style = space
+indent_size = 2
+
+# JSON files
+[*.json]
+indent_style = space
+indent_size = 2
+
+# Markdown files
+[*.md]
+trim_trailing_whitespace = false
+max_line_length = off
+
+# Makefile
+[Makefile]
+indent_style = tab
diff --git a/.env.example b/.env.example
new file mode 100644
index 0000000..6af4530
--- /dev/null
+++ b/.env.example
@@ -0,0 +1,51 @@
+# Environment Configuration Template
+# Copy this file to .env and customize the values
+
+# Model Configuration
+MODEL_PATH=models/sentiment_lstm_model.h5
+TOKENIZER_PATH=models/tokenizer.pkl
+HISTORY_PATH=models/training_history.json
+
+# Training Configuration
+EPOCHS=5
+BATCH_SIZE=128
+LEARNING_RATE=0.001
+VALIDATION_SPLIT=0.2
+
+# Model Architecture
+VOCAB_SIZE=10000
+MAX_LENGTH=300
+EMBEDDING_DIM=128
+LSTM_UNITS_1=64
+LSTM_UNITS_2=32
+DROPOUT_RATE=0.5
+
+# Logging
+LOG_LEVEL=INFO
+LOG_FILE=logs/sentiment_analysis.log
+
+# Directories
+DATA_DIR=data
+MODELS_DIR=models
+OUTPUTS_DIR=outputs
+LOGS_DIR=logs
+
+# TensorFlow Configuration
+TF_CPP_MIN_LOG_LEVEL=2
+CUDA_VISIBLE_DEVICES=0
+
+# API Configuration (for FastAPI)
+API_HOST=0.0.0.0
+API_PORT=8000
+API_WORKERS=4
+API_RELOAD=false
+
+# Database (optional, for production deployments)
+# DATABASE_URL=postgresql://user:password@localhost/sentiment_db
+
+# Redis (optional, for caching)
+# REDIS_URL=redis://localhost:6379/0
+
+# Monitoring (optional)
+# SENTRY_DSN=https://...
+# PROMETHEUS_PORT=9090
diff --git a/.flake8 b/.flake8
new file mode 100644
index 0000000..68f2bcd
--- /dev/null
+++ b/.flake8
@@ -0,0 +1,18 @@
+[flake8]
+max-line-length = 100
+extend-ignore = E203, W503, E501
+exclude =
+    .git,
+    __pycache__,
+    .venv,
+    venv,
+    .tox,
+    build,
+    dist,
+    *.egg-info,
+    .pytest_cache,
+    .mypy_cache
+per-file-ignores =
+    __init__.py:F401
+max-complexity = 10
+docstring-convention = google
diff --git a/.github/ISSUE_TEMPLATE/bug_report.md b/.github/ISSUE_TEMPLATE/bug_report.md
new file mode 100644
index 0000000..4b8597c
--- /dev/null
+++ b/.github/ISSUE_TEMPLATE/bug_report.md
@@ -0,0 +1,39 @@
+---
+name: Bug Report
+about: Create a report to help us improve
+title: '[BUG] '
+labels: bug
+assignees: ''
+---
+
+## Bug Description
+A clear and concise description of what the bug is.
+
+## To Reproduce
+Steps to reproduce the behavior:
+1. Go to '...'
+2. Run '....'
+3. See error
+
+## Expected Behavior
+A clear and concise description of what you expected to happen.
+
+## Actual Behavior
+What actually happened.
+
+## Error Messages/Logs
+```
+Paste any error messages or logs here
+```
+
+## Environment
+- OS: [e.g., Ubuntu 20.04, Windows 10, macOS 12]
+- Python Version: [e.g., 3.10.5]
+- TensorFlow Version: [e.g., 2.10.0]
+- Package Version: [e.g., 1.0.0]
+
+## Additional Context
+Add any other context about the problem here, such as:
+- Screenshots
+- Related issues
+- Possible solutions you've tried
diff --git a/.github/ISSUE_TEMPLATE/feature_request.md b/.github/ISSUE_TEMPLATE/feature_request.md
new file mode 100644
index 0000000..5bdf2e0
--- /dev/null
+++ b/.github/ISSUE_TEMPLATE/feature_request.md
@@ -0,0 +1,22 @@
+---
+name: Feature Request
+about: Suggest an idea for this project
+title: '[FEATURE] '
+labels: enhancement
+assignees: ''
+---
+
+## Is your feature request related to a problem?
+A clear and concise description of what the problem is. Ex. I'm always frustrated when [...]
+
+## Describe the solution you'd like
+A clear and concise description of what you want to happen.
+
+## Describe alternatives you've considered
+A clear and concise description of any alternative solutions or features you've considered.
+
+## Additional context
+Add any other context, screenshots, or examples about the feature request here.
+
+## Potential Implementation
+If you have ideas about how to implement this feature, please share them here.
diff --git a/.github/pull_request_template.md b/.github/pull_request_template.md
new file mode 100644
index 0000000..5ef7dd3
--- /dev/null
+++ b/.github/pull_request_template.md
@@ -0,0 +1,34 @@
+## Description
+Please include a summary of the changes and which issue is fixed. Include relevant motivation and context.
+
+Fixes # (issue)
+
+## Type of Change
+Please delete options that are not relevant.
+
+- [ ] Bug fix (non-breaking change which fixes an issue)
+- [ ] New feature (non-breaking change which adds functionality)
+- [ ] Breaking change (fix or feature that would cause existing functionality to not work as expected)
+- [ ] Documentation update
+- [ ] Performance improvement
+- [ ] Code refactoring
+
+## How Has This Been Tested?
+Please describe the tests that you ran to verify your changes.
+
+- [ ] Test A
+- [ ] Test B
+
+## Checklist
+- [ ] My code follows the style guidelines of this project
+- [ ] I have performed a self-review of my own code
+- [ ] I have commented my code, particularly in hard-to-understand areas
+- [ ] I have made corresponding changes to the documentation
+- [ ] My changes generate no new warnings
+- [ ] I have added tests that prove my fix is effective or that my feature works
+- [ ] New and existing unit tests pass locally with my changes
+- [ ] Any dependent changes have been merged and published
+
+## Screenshots (if appropriate)
+
+## Additional Notes
diff --git a/.github/workflows/ci.yml b/.github/workflows/ci.yml
new file mode 100644
index 0000000..8eb0dcf
--- /dev/null
+++ b/.github/workflows/ci.yml
@@ -0,0 +1,157 @@
+name: CI/CD Pipeline
+
+on:
+  push:
+    branches: [ main, develop ]
+  pull_request:
+    branches: [ main, develop ]
+  workflow_dispatch:
+
+jobs:
+  # Code quality checks
+  lint:
+    name: Code Quality
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v3
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.10'
+
+      - name: Cache pip packages
+        uses: actions/cache@v3
+        with:
+          path: ~/.cache/pip
+          key: ${{ runner.os }}-pip-${{ hashFiles('requirements.txt') }}
+          restore-keys: |
+            ${{ runner.os }}-pip-
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install black flake8 isort mypy
+          pip install -r requirements.txt
+
+      - name: Run black
+        run: black --check src/ tests/
+        continue-on-error: true
+
+      - name: Run isort
+        run: isort --check-only src/ tests/
+        continue-on-error: true
+
+      - name: Run flake8
+        run: flake8 src/ tests/ --max-line-length=100 --extend-ignore=E203,W503
+        continue-on-error: true
+
+  # Unit tests
+  test:
+    name: Tests
+    runs-on: ${{ matrix.os }}
+    strategy:
+      fail-fast: false
+      matrix:
+        os: [ubuntu-latest, macos-latest, windows-latest]
+        python-version: ['3.8', '3.9', '3.10', '3.11']
+        exclude:
+          - os: macos-latest
+            python-version: '3.8'
+          - os: windows-latest
+            python-version: '3.8'
+
+    steps:
+      - uses: actions/checkout@v3
+
+      - name: Set up Python ${{ matrix.python-version }}
+        uses: actions/setup-python@v4
+        with:
+          python-version: ${{ matrix.python-version }}
+
+      - name: Cache pip packages
+        uses: actions/cache@v3
+        with:
+          path: ~/.cache/pip
+          key: ${{ runner.os }}-pip-${{ hashFiles('requirements.txt') }}
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install -r requirements.txt
+          pip install pytest pytest-cov
+          pip install -e .
+
+      - name: Run tests
+        run: |
+          pytest tests/ -v --cov=sentiment_analysis --cov-report=xml --cov-report=term
+
+      - name: Upload coverage
+        if: matrix.os == 'ubuntu-latest' && matrix.python-version == '3.10'
+        uses: codecov/codecov-action@v3
+        with:
+          file: ./coverage.xml
+          flags: unittests
+          name: codecov-umbrella
+
+  # Security scan
+  security:
+    name: Security Scan
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v3
+
+      - name: Run Bandit
+        uses: tj-actions/bandit@v5.1
+        with:
+          targets: |
+            src/
+          options: "-r -ll"
+
+      - name: Run Safety check
+        run: |
+          pip install safety
+          safety check --json || true
+
+  # Docker build
+  docker:
+    name: Docker Build
+    runs-on: ubuntu-latest
+    needs: [lint, test]
+    steps:
+      - uses: actions/checkout@v3
+
+      - name: Set up Docker Buildx
+        uses: docker/setup-buildx-action@v2
+
+      - name: Build Docker image
+        uses: docker/build-push-action@v4
+        with:
+          context: .
+          push: false
+          tags: sentiment-analysis-lstm:latest
+          cache-from: type=gha
+          cache-to: type=gha,mode=max
+
+      - name: Test Docker image
+        run: |
+          docker build -t sentiment-analysis-lstm:test .
+          docker run --rm sentiment-analysis-lstm:test python -c "import sentiment_analysis; print('Docker image works!')"
+
+  # Documentation
+  docs:
+    name: Documentation
+    runs-on: ubuntu-latest
+    steps:
+      - uses: actions/checkout@v3
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.10'
+
+      - name: Check documentation
+        run: |
+          python -m pip install --upgrade pip
+          pip install pydocstyle
+          pydocstyle src/ || true
diff --git a/.github/workflows/release.yml b/.github/workflows/release.yml
new file mode 100644
index 0000000..f1584a2
--- /dev/null
+++ b/.github/workflows/release.yml
@@ -0,0 +1,43 @@
+name: Release
+
+on:
+  release:
+    types: [published]
+  workflow_dispatch:
+
+jobs:
+  build-and-publish:
+    name: Build and Publish
+    runs-on: ubuntu-latest
+
+    steps:
+      - uses: actions/checkout@v3
+
+      - name: Set up Python
+        uses: actions/setup-python@v4
+        with:
+          python-version: '3.10'
+
+      - name: Install dependencies
+        run: |
+          python -m pip install --upgrade pip
+          pip install build twine
+
+      - name: Build package
+        run: python -m build
+
+      - name: Check package
+        run: twine check dist/*
+
+      - name: Publish to PyPI
+        if: github.event_name == 'release'
+        env:
+          TWINE_USERNAME: __token__
+          TWINE_PASSWORD: ${{ secrets.PYPI_API_TOKEN }}
+        run: twine upload dist/*
+
+      - name: Create GitHub Release Assets
+        if: github.event_name == 'release'
+        uses: softprops/action-gh-release@v1
+        with:
+          files: dist/*
diff --git a/.pre-commit-config.yaml b/.pre-commit-config.yaml
new file mode 100644
index 0000000..dcf75fb
--- /dev/null
+++ b/.pre-commit-config.yaml
@@ -0,0 +1,83 @@
+# Pre-commit hooks for code quality
+# Install: pip install pre-commit
+# Setup: pre-commit install
+# Run manually: pre-commit run --all-files
+
+repos:
+  # General file checks
+  - repo: https://github.com/pre-commit/pre-commit-hooks
+    rev: v4.5.0
+    hooks:
+      - id: trailing-whitespace
+      - id: end-of-file-fixer
+      - id: check-yaml
+      - id: check-added-large-files
+        args: ['--maxkb=10000']
+      - id: check-json
+      - id: check-toml
+      - id: check-merge-conflict
+      - id: detect-private-key
+      - id: mixed-line-ending
+      - id: check-case-conflict
+
+  # Python code formatting with black
+  - repo: https://github.com/psf/black
+    rev: 23.12.1
+    hooks:
+      - id: black
+        language_version: python3.10
+        args: ['--line-length=100']
+
+  # Import sorting with isort
+  - repo: https://github.com/PyCQA/isort
+    rev: 5.13.2
+    hooks:
+      - id: isort
+        args: ['--profile=black', '--line-length=100']
+
+  # Linting with flake8
+  - repo: https://github.com/PyCQA/flake8
+    rev: 7.0.0
+    hooks:
+      - id: flake8
+        args: ['--max-line-length=100', '--extend-ignore=E203,W503']
+        additional_dependencies: [flake8-docstrings]
+
+  # Type checking with mypy
+  - repo: https://github.com/pre-commit/mirrors-mypy
+    rev: v1.8.0
+    hooks:
+      - id: mypy
+        additional_dependencies: [types-all]
+        args: ['--ignore-missing-imports', '--no-strict-optional']
+        exclude: ^tests/
+
+  # Security checks with bandit
+  - repo: https://github.com/PyCQA/bandit
+    rev: 1.7.6
+    hooks:
+      - id: bandit
+        args: ['-r', 'src/', '-ll']
+        exclude: ^tests/
+
+  # Docstring coverage
+  - repo: https://github.com/econchick/interrogate
+    rev: 1.5.0
+    hooks:
+      - id: interrogate
+        args: ['--verbose', '--fail-under=80', 'src/']
+        pass_filenames: false
+
+  # Check for common security issues
+  - repo: https://github.com/Lucas-C/pre-commit-hooks-safety
+    rev: v1.3.3
+    hooks:
+      - id: python-safety-dependencies-check
+        files: requirements.txt
+
+  # Prettier for JSON, YAML, Markdown
+  - repo: https://github.com/pre-commit/mirrors-prettier
+    rev: v4.0.0-alpha.8
+    hooks:
+      - id: prettier
+        types_or: [json, yaml, markdown]
diff --git a/CHANGELOG.md b/CHANGELOG.md
new file mode 100644
index 0000000..de7d243
--- /dev/null
+++ b/CHANGELOG.md
@@ -0,0 +1,76 @@
+# Changelog
+
+All notable changes to this project will be documented in this file.
+
+The format is based on [Keep a Changelog](https://keepachangelog.com/en/1.0.0/),
+and this project adheres to [Semantic Versioning](https://semver.org/spec/v2.0.0.html).
+
+## [Unreleased]
+
+### Added
+- Production-ready features and infrastructure
+
+## [1.0.0] - 2024-01-XX
+
+### Added
+- Complete repository reorganization with modular architecture
+- Modular package structure under `src/sentiment_analysis/`
+- Separated concerns into dedicated modules:
+  - `config.py` - Configuration management
+  - `data_loader.py` - Data loading and preprocessing
+  - `model.py` - LSTM model architecture with variants
+  - `train.py` - Training logic with callbacks
+  - `predict.py` - Prediction logic with batch support
+  - `utils.py` - Utility functions and helpers
+  - `visualization.py` - Comprehensive plotting functions
+  - `cli.py` - Command-line interface
+  - `exceptions.py` - Custom exception classes
+  - `api.py` - REST API with FastAPI
+- CLI tools (`sentiment-train`, `sentiment-predict`)
+- Python API for programmatic access
+- Comprehensive unit tests with pytest
+- Multiple usage examples (basic, custom, interactive)
+- Jupyter notebook tutorial
+- Model persistence (save/load functionality)
+- Training callbacks (early stopping, checkpointing, LR reduction)
+- Rich visualizations (training curves, confusion matrix, ROC curves)
+- Configuration management system
+- Logging throughout the application
+- Docker support (Dockerfile, docker-compose.yml)
+- GitHub Actions CI/CD workflows
+- Pre-commit hooks configuration
+- Environment variable support (.env.example)
+- Makefile for common development tasks
+- Type checking configuration (mypy)
+- Code formatting configuration (black, isort, flake8)
+- Issue templates and PR template
+- Comprehensive documentation (README.md, CONTRIBUTING.md)
+
+### Changed
+- Transformed from single monolithic script to professional package
+- Enhanced README with detailed usage instructions
+- Updated .gitignore for new project structure
+
+### Fixed
+- Various code quality improvements
+- Better error handling with custom exceptions
+
+## [0.1.0] - Initial Release
+
+### Added
+- Basic sentiment analysis with LSTM
+- Single monolithic script implementation
+- IMDB dataset support
+- Basic model training and prediction
+- Simple visualization of training results
+
+---
+
+## Legend
+
+- **Added** for new features
+- **Changed** for changes in existing functionality
+- **Deprecated** for soon-to-be removed features
+- **Removed** for now removed features
+- **Fixed** for any bug fixes
+- **Security** for vulnerability fixes
diff --git a/Dockerfile b/Dockerfile
new file mode 100644
index 0000000..4264277
--- /dev/null
+++ b/Dockerfile
@@ -0,0 +1,66 @@
+# Multi-stage Dockerfile for Sentiment Analysis LSTM
+
+# Stage 1: Builder
+FROM python:3.10-slim as builder
+
+# Set working directory
+WORKDIR /app
+
+# Install build dependencies
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    build-essential \
+    gcc \
+    g++ \
+    && rm -rf /var/lib/apt/lists/*
+
+# Copy requirements
+COPY requirements.txt .
+
+# Install Python dependencies
+RUN pip install --no-cache-dir --user -r requirements.txt
+
+# Stage 2: Runtime
+FROM python:3.10-slim
+
+# Set working directory
+WORKDIR /app
+
+# Install runtime dependencies
+RUN apt-get update && apt-get install -y --no-install-recommends \
+    libgomp1 \
+    && rm -rf /var/lib/apt/lists/*
+
+# Copy Python packages from builder
+COPY --from=builder /root/.local /root/.local
+
+# Copy application code
+COPY src/ ./src/
+COPY setup.py .
+COPY README.md .
+COPY LICENSE .
+
+# Install the package
+RUN pip install --no-cache-dir -e .
+
+# Create necessary directories
+RUN mkdir -p /app/data /app/models /app/logs /app/outputs
+
+# Set environment variables
+ENV PYTHONUNBUFFERED=1 \
+    PYTHONDONTWRITEBYTECODE=1 \
+    PATH=/root/.local/bin:$PATH
+
+# Expose port for API (if running API)
+EXPOSE 8000
+
+# Health check
+HEALTHCHECK --interval=30s --timeout=10s --start-period=5s --retries=3 \
+    CMD python -c "import sentiment_analysis; print('healthy')" || exit 1
+
+# Default command
+CMD ["python", "-m", "sentiment_analysis.cli"]
+
+# Labels
+LABEL maintainer="your.email@example.com" \
+      version="1.0.0" \
+      description="Sentiment Analysis with LSTM - Production Ready"
diff --git a/Makefile b/Makefile
new file mode 100644
index 0000000..880447f
--- /dev/null
+++ b/Makefile
@@ -0,0 +1,159 @@
+.PHONY: help install install-dev test lint format clean docker-build docker-run train predict
+
+# Default target
+.DEFAULT_GOAL := help
+
+# Variables
+PYTHON := python3
+PIP := pip3
+PYTEST := pytest
+BLACK := black
+ISORT := isort
+FLAKE8 := flake8
+DOCKER := docker
+DOCKER_COMPOSE := docker-compose
+
+help: ## Show this help message
+	@echo 'Usage: make [target]'
+	@echo ''
+	@echo 'Available targets:'
+	@awk 'BEGIN {FS = ":.*?## "} /^[a-zA-Z_-]+:.*?## / {printf "  \033[36m%-20s\033[0m %s\n", $$1, $$2}' $(MAKEFILE_LIST)
+
+install: ## Install package and dependencies
+	$(PIP) install -r requirements.txt
+	$(PIP) install -e .
+
+install-dev: ## Install package with development dependencies
+	$(PIP) install -r requirements.txt
+	$(PIP) install -e ".[dev]"
+	pre-commit install
+
+test: ## Run tests
+	$(PYTEST) tests/ -v --cov=sentiment_analysis --cov-report=html --cov-report=term
+
+test-fast: ## Run tests without coverage
+	$(PYTEST) tests/ -v
+
+lint: ## Run linters
+	$(FLAKE8) src/ tests/
+	$(BLACK) --check src/ tests/
+	$(ISORT) --check-only src/ tests/
+
+format: ## Format code with black and isort
+	$(BLACK) src/ tests/ examples/
+	$(ISORT) src/ tests/ examples/
+
+type-check: ## Run type checking with mypy
+	mypy src/
+
+clean: ## Clean build artifacts
+	rm -rf build/
+	rm -rf dist/
+	rm -rf *.egg-info
+	rm -rf .pytest_cache
+	rm -rf .coverage
+	rm -rf htmlcov/
+	rm -rf .mypy_cache
+	rm -rf .tox/
+	find . -type d -name __pycache__ -exec rm -rf {} +
+	find . -type f -name "*.pyc" -delete
+
+clean-models: ## Clean saved models
+	rm -rf models/*.h5
+	rm -rf models/*.pkl
+	rm -rf models/*.json
+
+clean-all: clean clean-models ## Clean everything
+
+# Docker targets
+docker-build: ## Build Docker image
+	$(DOCKER) build -t sentiment-analysis-lstm:latest .
+
+docker-run: ## Run Docker container
+	$(DOCKER) run -it --rm -v $(PWD)/models:/app/models sentiment-analysis-lstm:latest
+
+docker-compose-up: ## Start all services with docker-compose
+	$(DOCKER_COMPOSE) up -d
+
+docker-compose-down: ## Stop all services
+	$(DOCKER_COMPOSE) down
+
+docker-compose-logs: ## View logs from docker-compose
+	$(DOCKER_COMPOSE) logs -f
+
+# Training and prediction
+train: ## Train the model
+	$(PYTHON) -m sentiment_analysis.cli train
+
+train-custom: ## Train with custom parameters (epochs=10, batch-size=64)
+	$(PYTHON) -m sentiment_analysis.cli train --epochs 10 --batch-size 64
+
+predict: ## Run example predictions
+	$(PYTHON) -m sentiment_analysis.cli predict --examples
+
+predict-text: ## Predict sentiment for a text (use TEXT="your text")
+	$(PYTHON) -m sentiment_analysis.cli predict --text "$(TEXT)"
+
+# Development
+dev-server: ## Run development server (if API is implemented)
+	uvicorn sentiment_analysis.api:app --reload --host 0.0.0.0 --port 8000
+
+notebook: ## Start Jupyter notebook
+	jupyter notebook notebooks/
+
+# Pre-commit
+pre-commit-install: ## Install pre-commit hooks
+	pre-commit install
+
+pre-commit-run: ## Run pre-commit on all files
+	pre-commit run --all-files
+
+# Build and distribution
+build: clean ## Build package
+	$(PYTHON) -m build
+
+publish-test: build ## Publish to TestPyPI
+	$(PYTHON) -m twine upload --repository testpypi dist/*
+
+publish: build ## Publish to PyPI
+	$(PYTHON) -m twine upload dist/*
+
+# Documentation
+docs: ## Build documentation (if using Sphinx)
+	cd docs && make html
+
+# CI/CD
+ci: lint test ## Run CI checks locally
+
+# Security
+security-check: ## Run security checks
+	safety check
+	bandit -r src/
+
+# Database migrations (if using databases)
+# db-init: ## Initialize database
+#	alembic init migrations
+
+# db-migrate: ## Create new migration
+#	alembic revision --autogenerate -m "$(MSG)"
+
+# db-upgrade: ## Apply migrations
+#	alembic upgrade head
+
+# Monitoring and profiling
+profile: ## Profile the training code
+	$(PYTHON) -m cProfile -o profile.stats examples/basic_usage.py
+	$(PYTHON) -m pstats profile.stats
+
+# Version management
+version: ## Show current version
+	@$(PYTHON) -c "import sentiment_analysis; print(sentiment_analysis.__version__)"
+
+bump-patch: ## Bump patch version
+	bump2version patch
+
+bump-minor: ## Bump minor version
+	bump2version minor
+
+bump-major: ## Bump major version
+	bump2version major
diff --git a/SECURITY.md b/SECURITY.md
new file mode 100644
index 0000000..d546492
--- /dev/null
+++ b/SECURITY.md
@@ -0,0 +1,128 @@
+# Security Policy
+
+## Supported Versions
+
+We release patches for security vulnerabilities in the following versions:
+
+| Version | Supported          |
+| ------- | ------------------ |
+| 1.0.x   | :white_check_mark: |
+| < 1.0   | :x:                |
+
+## Reporting a Vulnerability
+
+We take the security of Sentiment Analysis LSTM seriously. If you believe you have found a security vulnerability, please report it to us as described below.
+
+### How to Report a Security Vulnerability
+
+**Please do not report security vulnerabilities through public GitHub issues.**
+
+Instead, please report them via email to: [your.email@example.com]
+
+You should receive a response within 48 hours. If for some reason you do not, please follow up via email to ensure we received your original message.
+
+### What to Include in Your Report
+
+Please include the following information:
+
+- Type of vulnerability (e.g., XSS, SQLi, etc.)
+- Full paths of source file(s) related to the vulnerability
+- The location of the affected source code (tag/branch/commit or direct URL)
+- Any special configuration required to reproduce the issue
+- Step-by-step instructions to reproduce the issue
+- Proof-of-concept or exploit code (if possible)
+- Impact of the issue, including how an attacker might exploit it
+
+### What to Expect
+
+- We will acknowledge receipt of your vulnerability report
+- We will send you a more detailed response indicating the next steps
+- We will work with you to understand and resolve the issue
+- We will keep you informed about our progress
+- We will credit you in the security advisory (if you wish)
+
+## Security Best Practices
+
+When using this package in production:
+
+### 1. Model Security
+- Store trained models in secure locations
+- Use access controls for model files
+- Validate model integrity before loading
+
+### 2. Input Validation
+- Always validate user input before processing
+- Set appropriate text length limits
+- Sanitize inputs to prevent injection attacks
+
+### 3. API Security
+- Use HTTPS in production
+- Implement rate limiting
+- Add authentication and authorization
+- Configure CORS appropriately
+- Use environment variables for sensitive configuration
+
+### 4. Dependency Security
+- Regularly update dependencies
+- Use `safety` to check for known vulnerabilities
+- Pin dependency versions in production
+
+### 5. Data Privacy
+- Don't log sensitive user data
+- Implement proper data retention policies
+- Comply with GDPR/CCPA if applicable
+
+### 6. Docker Security
+- Don't run containers as root
+- Use minimal base images
+- Scan images for vulnerabilities
+- Keep base images updated
+
+## Security Checklist for Production
+
+- [ ] HTTPS enabled
+- [ ] Authentication implemented
+- [ ] Rate limiting configured
+- [ ] Input validation in place
+- [ ] Dependencies updated
+- [ ] Security headers configured
+- [ ] Logging and monitoring enabled
+- [ ] Secrets stored securely (not in code)
+- [ ] Regular security audits scheduled
+- [ ] Incident response plan in place
+
+## Known Security Considerations
+
+### TensorFlow Security
+- Keep TensorFlow updated to latest stable version
+- Be aware of potential model poisoning attacks
+- Validate model files from untrusted sources
+
+### FastAPI Security
+- Configure CORS appropriately for your use case
+- Implement proper authentication
+- Use HTTPS in production
+- Enable rate limiting
+
+## Security Tools
+
+We use the following tools to maintain security:
+
+- **Bandit**: Python security linter
+- **Safety**: Dependency vulnerability checker
+- **Pre-commit hooks**: Automated security checks
+- **GitHub Security Alerts**: Dependency vulnerability notifications
+- **CodeQL**: Code security analysis (via GitHub Actions)
+
+## Disclosure Policy
+
+When we receive a security report, we will:
+
+1. Confirm the problem and determine affected versions
+2. Audit code to find similar problems
+3. Prepare fixes for all supported versions
+4. Release new versions as soon as possible
+
+## Comments on this Policy
+
+If you have suggestions on how this process could be improved, please submit a pull request or open an issue.
diff --git a/docker-compose.yml b/docker-compose.yml
new file mode 100644
index 0000000..1a66c58
--- /dev/null
+++ b/docker-compose.yml
@@ -0,0 +1,81 @@
+version: '3.8'
+
+services:
+  # Training service
+  sentiment-train:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    container_name: sentiment-lstm-train
+    volumes:
+      - ./data:/app/data
+      - ./models:/app/models
+      - ./outputs:/app/outputs
+      - ./logs:/app/logs
+    environment:
+      - PYTHONUNBUFFERED=1
+      - TF_CPP_MIN_LOG_LEVEL=2
+    command: python -c "from sentiment_analysis.train import Trainer; trainer = Trainer(); data = trainer.prepare_data(); trainer.train(*data[0], *data[1], epochs=5)"
+    deploy:
+      resources:
+        limits:
+          cpus: '4'
+          memory: 8G
+        reservations:
+          cpus: '2'
+          memory: 4G
+
+  # API service
+  sentiment-api:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    container_name: sentiment-lstm-api
+    ports:
+      - "8000:8000"
+    volumes:
+      - ./models:/app/models:ro
+      - ./logs:/app/logs
+    environment:
+      - PYTHONUNBUFFERED=1
+      - MODEL_PATH=/app/models/sentiment_lstm_model.h5
+    command: uvicorn sentiment_analysis.api:app --host 0.0.0.0 --port 8000 --reload
+    depends_on:
+      - sentiment-train
+    deploy:
+      resources:
+        limits:
+          cpus: '2'
+          memory: 4G
+    restart: unless-stopped
+
+  # Jupyter notebook service
+  sentiment-notebook:
+    build:
+      context: .
+      dockerfile: Dockerfile
+    container_name: sentiment-lstm-notebook
+    ports:
+      - "8888:8888"
+    volumes:
+      - ./notebooks:/app/notebooks
+      - ./data:/app/data
+      - ./models:/app/models
+      - ./src:/app/src
+    environment:
+      - JUPYTER_ENABLE_LAB=yes
+    command: jupyter lab --ip=0.0.0.0 --port=8888 --no-browser --allow-root --NotebookApp.token='' --NotebookApp.password=''
+    deploy:
+      resources:
+        limits:
+          memory: 2G
+
+volumes:
+  data:
+  models:
+  outputs:
+  logs:
+
+networks:
+  default:
+    name: sentiment-network
diff --git a/docs/API.md b/docs/API.md
new file mode 100644
index 0000000..3efea20
--- /dev/null
+++ b/docs/API.md
@@ -0,0 +1,392 @@
+# API Documentation
+
+REST API documentation for Sentiment Analysis LSTM.
+
+## Table of Contents
+
+- [Getting Started](#getting-started)
+- [Authentication](#authentication)
+- [Endpoints](#endpoints)
+- [Request/Response Examples](#requestresponse-examples)
+- [Error Handling](#error-handling)
+- [Rate Limiting](#rate-limiting)
+- [Deployment](#deployment)
+
+## Getting Started
+
+### Installation
+
+```bash
+# Install API dependencies
+pip install -r requirements-api.txt
+
+# Or install with extras
+pip install -e ".[api]"
+```
+
+### Running the API
+
+```bash
+# Development mode
+uvicorn sentiment_analysis.api:app --reload
+
+# Production mode
+uvicorn sentiment_analysis.api:app --host 0.0.0.0 --port 8000 --workers 4
+
+# Using the script
+bash scripts/start_api.sh
+
+# Using Makefile
+make dev-server
+```
+
+### Interactive Documentation
+
+Once running, access:
+- **Swagger UI**: http://localhost:8000/docs
+- **ReDoc**: http://localhost:8000/redoc
+
+## Authentication
+
+Currently, the API does not require authentication. For production use, implement authentication using:
+
+- API Keys
+- OAuth2
+- JWT tokens
+
+Example with API key (to be implemented):
+
+```python
+from fastapi import Header, HTTPException
+
+async def verify_api_key(x_api_key: str = Header(...)):
+    if x_api_key != "your-secret-key":
+        raise HTTPException(status_code=403, detail="Invalid API key")
+```
+
+## Endpoints
+
+### Root
+
+**GET /** - API Information
+
+Response:
+```json
+{
+  "name": "Sentiment Analysis API",
+  "version": "1.0.0",
+  "status": "running",
+  "docs": "/docs",
+  "health": "/health"
+}
+```
+
+### Health Check
+
+**GET /health** - Service Health Status
+
+Response:
+```json
+{
+  "status": "healthy",
+  "model_loaded": true,
+  "version": "1.0.0",
+  "timestamp": "2024-01-01T12:00:00"
+}
+```
+
+### Model Info
+
+**GET /model/info** - Model Configuration
+
+Response:
+```json
+{
+  "vocab_size": 10000,
+  "max_length": 300,
+  "embedding_dim": 128,
+  "model_path": "models/sentiment_lstm_model.h5",
+  "model_exists": true
+}
+```
+
+### Single Prediction
+
+**POST /predict** - Predict Single Text
+
+Request Body:
+```json
+{
+  "text": "This movie was amazing!"
+}
+```
+
+Response:
+```json
+{
+  "text": "This movie was amazing!",
+  "sentiment": "Positive",
+  "score": 0.9234,
+  "confidence": 0.8468,
+  "timestamp": "2024-01-01T12:00:00"
+}
+```
+
+### Batch Prediction
+
+**POST /predict/batch** - Predict Multiple Texts
+
+Request Body:
+```json
+{
+  "texts": [
+    "Great movie!",
+    "Terrible film.",
+    "It was okay."
+  ]
+}
+```
+
+Response:
+```json
+{
+  "predictions": [
+    {
+      "text": "Great movie!",
+      "sentiment": "Positive",
+      "score": 0.95,
+      "confidence": 0.90,
+      "timestamp": "2024-01-01T12:00:00"
+    },
+    {
+      "text": "Terrible film.",
+      "sentiment": "Negative",
+      "score": 0.12,
+      "confidence": 0.76,
+      "timestamp": "2024-01-01T12:00:00"
+    },
+    {
+      "text": "It was okay.",
+      "sentiment": "Positive",
+      "score": 0.58,
+      "confidence": 0.16,
+      "timestamp": "2024-01-01T12:00:00"
+    }
+  ],
+  "count": 3,
+  "timestamp": "2024-01-01T12:00:00"
+}
+```
+
+## Request/Response Examples
+
+### Using cURL
+
+```bash
+# Health check
+curl http://localhost:8000/health
+
+# Single prediction
+curl -X POST http://localhost:8000/predict \
+  -H "Content-Type: application/json" \
+  -d '{"text": "Amazing movie!"}'
+
+# Batch prediction
+curl -X POST http://localhost:8000/predict/batch \
+  -H "Content-Type: application/json" \
+  -d '{"texts": ["Great!", "Bad!", "Okay."]}'
+```
+
+### Using Python requests
+
+```python
+import requests
+
+# Single prediction
+response = requests.post(
+    "http://localhost:8000/predict",
+    json={"text": "This movie was fantastic!"}
+)
+print(response.json())
+
+# Batch prediction
+response = requests.post(
+    "http://localhost:8000/predict/batch",
+    json={"texts": ["Great movie!", "Terrible film.", "It was okay."]}
+)
+print(response.json())
+```
+
+### Using JavaScript/Fetch
+
+```javascript
+// Single prediction
+fetch('http://localhost:8000/predict', {
+  method: 'POST',
+  headers: {
+    'Content-Type': 'application/json',
+  },
+  body: JSON.stringify({
+    text: 'This movie was amazing!'
+  })
+})
+.then(response => response.json())
+.then(data => console.log(data));
+```
+
+## Error Handling
+
+### HTTP Status Codes
+
+- `200 OK` - Success
+- `422 Unprocessable Entity` - Validation error
+- `500 Internal Server Error` - Server error
+- `503 Service Unavailable` - Service not ready
+
+### Error Response Format
+
+```json
+{
+  "detail": "Error message here"
+}
+```
+
+### Common Errors
+
+**Empty text:**
+```json
+{
+  "detail": "Text cannot be empty or only whitespace"
+}
+```
+
+**Text too long:**
+```json
+{
+  "detail": "ensure this value has at most 10000 characters"
+}
+```
+
+**Model not loaded:**
+```json
+{
+  "detail": "Predictor not initialized. Please check if model is available."
+}
+```
+
+## Rate Limiting
+
+Implement rate limiting for production:
+
+```python
+from slowapi import Limiter, _rate_limit_exceeded_handler
+from slowapi.util import get_remote_address
+
+limiter = Limiter(key_func=get_remote_address)
+app.state.limiter = limiter
+app.add_exception_handler(RateLimitExceeded, _rate_limit_exceeded_handler)
+
+@app.post("/predict")
+@limiter.limit("100/minute")
+async def predict_sentiment(request: Request, ...):
+    ...
+```
+
+## Deployment
+
+### Using Docker
+
+```bash
+# Build
+docker build -t sentiment-api .
+
+# Run
+docker run -d -p 8000:8000 -v $(pwd)/models:/app/models:ro sentiment-api
+
+# With environment variables
+docker run -d \
+  -p 8000:8000 \
+  -e API_WORKERS=4 \
+  -v $(pwd)/models:/app/models:ro \
+  sentiment-api
+```
+
+### Using Docker Compose
+
+```bash
+docker-compose up -d sentiment-api
+```
+
+### Behind Nginx
+
+```nginx
+server {
+    listen 80;
+    server_name api.example.com;
+
+    location / {
+        proxy_pass http://localhost:8000;
+        proxy_set_header Host $host;
+        proxy_set_header X-Real-IP $remote_addr;
+        proxy_set_header X-Forwarded-For $proxy_add_x_forwarded_for;
+        proxy_set_header X-Forwarded-Proto $scheme;
+    }
+}
+```
+
+### Using Gunicorn
+
+```bash
+gunicorn sentiment_analysis.api:app \
+  -w 4 \
+  -k uvicorn.workers.UvicornWorker \
+  --bind 0.0.0.0:8000
+```
+
+### Environment Variables
+
+```bash
+export API_HOST=0.0.0.0
+export API_PORT=8000
+export API_WORKERS=4
+export MODEL_PATH=/path/to/model.h5
+```
+
+## Monitoring
+
+### Prometheus Metrics (to be implemented)
+
+```python
+from prometheus_fastapi_instrumentator import Instrumentator
+
+Instrumentator().instrument(app).expose(app)
+```
+
+### Health Checks
+
+```bash
+# Simple health check
+curl http://localhost:8000/health
+
+# Detailed check with jq
+curl -s http://localhost:8000/health | jq '.model_loaded'
+```
+
+## Performance Tips
+
+1. **Use batch predictions** for multiple texts
+2. **Enable caching** for frequently requested texts
+3. **Scale horizontally** with multiple workers
+4. **Use async workers** with Uvicorn
+5. **Implement connection pooling** for databases
+6. **Add Redis** for caching predictions
+
+## Security
+
+- Use HTTPS in production
+- Implement authentication
+- Add rate limiting
+- Validate all inputs
+- Configure CORS properly
+- Don't expose stack traces
+- Use environment variables for secrets
diff --git a/docs/DOCKER.md b/docs/DOCKER.md
new file mode 100644
index 0000000..a7a2716
--- /dev/null
+++ b/docs/DOCKER.md
@@ -0,0 +1,378 @@
+# Docker Guide
+
+This guide explains how to use Docker with the Sentiment Analysis LSTM project.
+
+## Table of Contents
+
+- [Prerequisites](#prerequisites)
+- [Building the Image](#building-the-image)
+- [Running Containers](#running-containers)
+- [Docker Compose](#docker-compose)
+- [Environment Variables](#environment-variables)
+- [Volumes](#volumes)
+- [Production Deployment](#production-deployment)
+
+## Prerequisites
+
+- Docker 20.10+
+- Docker Compose 2.0+ (optional)
+- At least 4GB RAM available for Docker
+- 10GB free disk space
+
+## Building the Image
+
+### Basic Build
+
+```bash
+docker build -t sentiment-analysis-lstm:latest .
+```
+
+### Build with specific platform
+
+```bash
+docker build --platform linux/amd64 -t sentiment-analysis-lstm:latest .
+```
+
+### Multi-stage build (already configured in Dockerfile)
+
+The Dockerfile uses multi-stage builds to minimize image size:
+- Stage 1: Builder (installs dependencies)
+- Stage 2: Runtime (minimal image with only necessary files)
+
+## Running Containers
+
+### Training
+
+```bash
+# Basic training
+docker run --rm \
+  -v $(pwd)/models:/app/models \
+  -v $(pwd)/data:/app/data \
+  sentiment-analysis-lstm:latest \
+  python -m sentiment_analysis.cli train
+
+# Training with custom parameters
+docker run --rm \
+  -v $(pwd)/models:/app/models \
+  -v $(pwd)/data:/app/data \
+  sentiment-analysis-lstm:latest \
+  python -m sentiment_analysis.cli train --epochs 10 --batch-size 64
+```
+
+### Prediction
+
+```bash
+# Example predictions
+docker run --rm \
+  -v $(pwd)/models:/app/models:ro \
+  sentiment-analysis-lstm:latest \
+  python -m sentiment_analysis.cli predict --examples
+
+# Single prediction
+docker run --rm \
+  -v $(pwd)/models:/app/models:ro \
+  sentiment-analysis-lstm:latest \
+  python -m sentiment_analysis.cli predict --text "Great movie!"
+```
+
+### API Server
+
+```bash
+docker run -d \
+  -p 8000:8000 \
+  -v $(pwd)/models:/app/models:ro \
+  --name sentiment-api \
+  sentiment-analysis-lstm:latest \
+  uvicorn sentiment_analysis.api:app --host 0.0.0.0 --port 8000
+```
+
+Access the API at: http://localhost:8000/docs
+
+## Docker Compose
+
+Docker Compose provides an easy way to run multiple services.
+
+### Start All Services
+
+```bash
+# Start in background
+docker-compose up -d
+
+# View logs
+docker-compose logs -f
+
+# Stop services
+docker-compose down
+```
+
+### Available Services
+
+1. **sentiment-train**: Training service
+2. **sentiment-api**: API server (port 8000)
+3. **sentiment-notebook**: Jupyter notebook (port 8888)
+
+### Individual Service Management
+
+```bash
+# Start only API
+docker-compose up -d sentiment-api
+
+# Restart training
+docker-compose restart sentiment-train
+
+# View API logs
+docker-compose logs -f sentiment-api
+```
+
+## Environment Variables
+
+### Available Variables
+
+```bash
+# Model paths
+MODEL_PATH=/app/models/sentiment_lstm_model.h5
+TOKENIZER_PATH=/app/models/tokenizer.pkl
+
+# Training
+EPOCHS=5
+BATCH_SIZE=128
+LEARNING_RATE=0.001
+
+# API
+API_HOST=0.0.0.0
+API_PORT=8000
+API_WORKERS=4
+
+# TensorFlow
+TF_CPP_MIN_LOG_LEVEL=2
+CUDA_VISIBLE_DEVICES=0
+```
+
+### Using .env File
+
+```bash
+# Create .env file
+cp .env.example .env
+
+# Edit with your values
+vim .env
+
+# Run with docker-compose (automatically loads .env)
+docker-compose up -d
+```
+
+### Passing Environment Variables
+
+```bash
+# Single variable
+docker run -e EPOCHS=10 sentiment-analysis-lstm:latest
+
+# Multiple variables
+docker run \
+  -e EPOCHS=10 \
+  -e BATCH_SIZE=64 \
+  sentiment-analysis-lstm:latest
+
+# From file
+docker run --env-file .env sentiment-analysis-lstm:latest
+```
+
+## Volumes
+
+### Recommended Volume Mounts
+
+```bash
+docker run \
+  -v $(pwd)/data:/app/data \        # Training data
+  -v $(pwd)/models:/app/models \    # Saved models
+  -v $(pwd)/outputs:/app/outputs \  # Visualizations
+  -v $(pwd)/logs:/app/logs \        # Log files
+  sentiment-analysis-lstm:latest
+```
+
+### Read-only Mounts
+
+For production API, mount models as read-only:
+
+```bash
+docker run \
+  -v $(pwd)/models:/app/models:ro \
+  sentiment-analysis-lstm:latest
+```
+
+## Production Deployment
+
+### Best Practices
+
+1. **Use specific image tags** (not `latest`)
+```bash
+docker build -t sentiment-analysis-lstm:1.0.0 .
+```
+
+2. **Set resource limits**
+```bash
+docker run \
+  --cpus=2 \
+  --memory=4g \
+  sentiment-analysis-lstm:1.0.0
+```
+
+3. **Use health checks**
+```bash
+docker run \
+  --health-cmd="python -c 'import sentiment_analysis'" \
+  --health-interval=30s \
+  --health-timeout=10s \
+  --health-retries=3 \
+  sentiment-analysis-lstm:1.0.0
+```
+
+4. **Run as non-root user** (add to Dockerfile)
+```dockerfile
+RUN useradd -m -u 1000 appuser
+USER appuser
+```
+
+5. **Use secrets for sensitive data**
+```bash
+docker secret create model_path /path/to/model.h5
+docker service create --secret model_path sentiment-analysis-lstm:1.0.0
+```
+
+### Docker Swarm Deployment
+
+```bash
+# Initialize swarm
+docker swarm init
+
+# Deploy stack
+docker stack deploy -c docker-compose.yml sentiment-stack
+
+# Scale services
+docker service scale sentiment-stack_sentiment-api=3
+
+# Update service
+docker service update --image sentiment-analysis-lstm:1.0.1 sentiment-stack_sentiment-api
+```
+
+### Kubernetes Deployment
+
+Example deployment:
+
+```yaml
+apiVersion: apps/v1
+kind: Deployment
+metadata:
+  name: sentiment-api
+spec:
+  replicas: 3
+  selector:
+    matchLabels:
+      app: sentiment-api
+  template:
+    metadata:
+      labels:
+        app: sentiment-api
+    spec:
+      containers:
+      - name: sentiment-api
+        image: sentiment-analysis-lstm:1.0.0
+        ports:
+        - containerPort: 8000
+        resources:
+          requests:
+            memory: "2Gi"
+            cpu: "1000m"
+          limits:
+            memory: "4Gi"
+            cpu: "2000m"
+        volumeMounts:
+        - name: models
+          mountPath: /app/models
+          readOnly: true
+      volumes:
+      - name: models
+        persistentVolumeClaim:
+          claimName: sentiment-models-pvc
+```
+
+## Troubleshooting
+
+### Container won't start
+
+```bash
+# Check logs
+docker logs <container-id>
+
+# Run interactively
+docker run -it sentiment-analysis-lstm:latest /bin/bash
+```
+
+### Out of memory
+
+```bash
+# Increase Docker memory limit
+# Or reduce batch size
+docker run -e BATCH_SIZE=32 sentiment-analysis-lstm:latest
+```
+
+### Model not found
+
+```bash
+# Verify volume mount
+docker run --rm -v $(pwd)/models:/app/models sentiment-analysis-lstm:latest ls -la /app/models
+
+# Train model if missing
+docker run --rm -v $(pwd)/models:/app/models sentiment-analysis-lstm:latest \
+  python -m sentiment_analysis.cli train
+```
+
+### Permission issues
+
+```bash
+# Fix permissions on host
+sudo chown -R $USER:$USER models/ data/ outputs/ logs/
+```
+
+## Advanced Usage
+
+### Building with BuildKit
+
+```bash
+DOCKER_BUILDKIT=1 docker build -t sentiment-analysis-lstm:latest .
+```
+
+### Multi-platform builds
+
+```bash
+docker buildx build --platform linux/amd64,linux/arm64 -t sentiment-analysis-lstm:latest .
+```
+
+### Inspect image
+
+```bash
+# View image layers
+docker history sentiment-analysis-lstm:latest
+
+# Inspect image
+docker inspect sentiment-analysis-lstm:latest
+
+# Scan for vulnerabilities
+docker scan sentiment-analysis-lstm:latest
+```
+
+## Cleaning Up
+
+```bash
+# Stop all containers
+docker-compose down
+
+# Remove volumes
+docker-compose down -v
+
+# Remove images
+docker rmi sentiment-analysis-lstm:latest
+
+# Clean system
+docker system prune -a
+```
diff --git a/pyproject.toml b/pyproject.toml
new file mode 100644
index 0000000..1c3669e
--- /dev/null
+++ b/pyproject.toml
@@ -0,0 +1,112 @@
+[build-system]
+requires = ["setuptools>=45", "wheel", "setuptools_scm[toml]>=6.2"]
+build-backend = "setuptools.build_meta"
+
+[project]
+name = "sentiment-analysis-lstm"
+version = "1.0.0"
+description = "Production-ready sentiment analysis using LSTM neural networks"
+readme = "README.md"
+requires-python = ">=3.8"
+license = {text = "MIT"}
+authors = [
+    {name = "Your Name", email = "your.email@example.com"}
+]
+keywords = ["sentiment-analysis", "lstm", "nlp", "deep-learning", "tensorflow"]
+classifiers = [
+    "Development Status :: 4 - Beta",
+    "Intended Audience :: Developers",
+    "Intended Audience :: Science/Research",
+    "Topic :: Scientific/Engineering :: Artificial Intelligence",
+    "Topic :: Text Processing :: Linguistic",
+    "License :: OSI Approved :: MIT License",
+    "Programming Language :: Python :: 3",
+    "Programming Language :: Python :: 3.8",
+    "Programming Language :: Python :: 3.9",
+    "Programming Language :: Python :: 3.10",
+    "Programming Language :: Python :: 3.11",
+]
+
+[project.urls]
+Homepage = "https://github.com/pyenthusiasts/Sentiment-Analysis-LSTM"
+Documentation = "https://github.com/pyenthusiasts/Sentiment-Analysis-LSTM#readme"
+Repository = "https://github.com/pyenthusiasts/Sentiment-Analysis-LSTM"
+Issues = "https://github.com/pyenthusiasts/Sentiment-Analysis-LSTM/issues"
+
+[tool.black]
+line-length = 100
+target-version = ['py38', 'py39', 'py310', 'py311']
+include = '\.pyi?$'
+exclude = '''
+/(
+    \.git
+  | \.venv
+  | \.tox
+  | build
+  | dist
+  | \.eggs
+)/
+'''
+
+[tool.isort]
+profile = "black"
+line_length = 100
+multi_line_output = 3
+include_trailing_comma = true
+force_grid_wrap = 0
+use_parentheses = true
+ensure_newline_before_comments = true
+skip_gitignore = true
+skip = [".venv", "venv", ".tox", "build", "dist"]
+
+[tool.mypy]
+python_version = "3.10"
+warn_return_any = true
+warn_unused_configs = true
+disallow_untyped_defs = false
+disallow_incomplete_defs = false
+check_untyped_defs = true
+no_implicit_optional = true
+warn_redundant_casts = true
+warn_unused_ignores = true
+warn_no_return = true
+follow_imports = "normal"
+ignore_missing_imports = true
+
+[[tool.mypy.overrides]]
+module = "tests.*"
+ignore_errors = true
+
+[tool.pytest.ini_options]
+minversion = "7.0"
+addopts = [
+    "-ra",
+    "--strict-markers",
+    "--strict-config",
+    "--showlocals",
+]
+testpaths = ["tests"]
+python_files = ["test_*.py"]
+python_classes = ["Test*"]
+python_functions = ["test_*"]
+
+[tool.coverage.run]
+source = ["src/sentiment_analysis"]
+omit = [
+    "*/tests/*",
+    "*/setup.py",
+]
+
+[tool.coverage.report]
+precision = 2
+show_missing = true
+skip_covered = false
+exclude_lines = [
+    "pragma: no cover",
+    "def __repr__",
+    "raise AssertionError",
+    "raise NotImplementedError",
+    "if __name__ == .__main__.:",
+    "if TYPE_CHECKING:",
+    "@abstractmethod",
+]
diff --git a/requirements-api.txt b/requirements-api.txt
new file mode 100644
index 0000000..3a1221d
--- /dev/null
+++ b/requirements-api.txt
@@ -0,0 +1,5 @@
+# API dependencies for FastAPI
+fastapi>=0.104.0
+uvicorn[standard]>=0.24.0
+pydantic>=2.0.0
+python-multipart>=0.0.6
diff --git a/scripts/start_api.sh b/scripts/start_api.sh
new file mode 100755
index 0000000..025b2a4
--- /dev/null
+++ b/scripts/start_api.sh
@@ -0,0 +1,39 @@
+#!/bin/bash
+# Start the FastAPI server
+
+set -e
+
+# Colors
+GREEN='\033[0;32m'
+NC='\033[0m'
+
+# Configuration
+HOST=${API_HOST:-0.0.0.0}
+PORT=${API_PORT:-8000}
+WORKERS=${API_WORKERS:-4}
+RELOAD=${API_RELOAD:-false}
+
+echo -e "${GREEN}Starting Sentiment Analysis API...${NC}"
+echo "Host: $HOST"
+echo "Port: $PORT"
+echo "Workers: $WORKERS"
+echo "Reload: $RELOAD"
+
+# Check if model exists
+if [ ! -f "models/sentiment_lstm_model.h5" ]; then
+    echo "Warning: Model file not found. Please train a model first."
+    echo "Run: make train"
+fi
+
+# Start server
+if [ "$RELOAD" = "true" ]; then
+    uvicorn sentiment_analysis.api:app \
+        --host "$HOST" \
+        --port "$PORT" \
+        --reload
+else
+    uvicorn sentiment_analysis.api:app \
+        --host "$HOST" \
+        --port "$PORT" \
+        --workers "$WORKERS"
+fi
diff --git a/scripts/train_model.sh b/scripts/train_model.sh
new file mode 100755
index 0000000..a0bbfd2
--- /dev/null
+++ b/scripts/train_model.sh
@@ -0,0 +1,43 @@
+#!/bin/bash
+# Training script with error handling and logging
+
+set -e  # Exit on error
+
+# Colors for output
+RED='\033[0;31m'
+GREEN='\033[0;32m'
+YELLOW='\033[1;33m'
+NC='\033[0m' # No Color
+
+# Configuration
+EPOCHS=${EPOCHS:-5}
+BATCH_SIZE=${BATCH_SIZE:-128}
+LOG_DIR="logs"
+MODEL_DIR="models"
+
+# Create directories
+mkdir -p "$LOG_DIR" "$MODEL_DIR"
+
+# Log file
+LOG_FILE="$LOG_DIR/training_$(date +%Y%m%d_%H%M%S).log"
+
+echo -e "${GREEN}Starting model training...${NC}"
+echo "Epochs: $EPOCHS"
+echo "Batch Size: $BATCH_SIZE"
+echo "Log file: $LOG_FILE"
+
+# Train model
+python -m sentiment_analysis.cli train \
+    --epochs "$EPOCHS" \
+    --batch-size "$BATCH_SIZE" \
+    --verbose 2 \
+    2>&1 | tee "$LOG_FILE"
+
+# Check if training was successful
+if [ $? -eq 0 ]; then
+    echo -e "${GREEN}Training completed successfully!${NC}"
+    echo "Model saved to: $MODEL_DIR/sentiment_lstm_model.h5"
+else
+    echo -e "${RED}Training failed! Check log file: $LOG_FILE${NC}"
+    exit 1
+fi
diff --git a/src/sentiment_analysis/api.py b/src/sentiment_analysis/api.py
new file mode 100644
index 0000000..8325722
--- /dev/null
+++ b/src/sentiment_analysis/api.py
@@ -0,0 +1,317 @@
+"""
+REST API for sentiment analysis using FastAPI.
+
+This module provides a production-ready REST API for sentiment analysis.
+Install FastAPI dependencies: pip install fastapi uvicorn python-multipart
+"""
+
+import os
+import logging
+from typing import List, Optional
+from datetime import datetime
+from pathlib import Path
+
+try:
+    from fastapi import FastAPI, HTTPException, status
+    from fastapi.middleware.cors import CORSMiddleware
+    from fastapi.responses import JSONResponse
+    from pydantic import BaseModel, Field, validator
+except ImportError:
+    raise ImportError(
+        "FastAPI dependencies not installed. "
+        "Install with: pip install fastapi uvicorn python-multipart pydantic"
+    )
+
+from sentiment_analysis.predict import Predictor
+from sentiment_analysis.config import ModelConfig
+from sentiment_analysis.exceptions import (
+    ModelNotFoundError,
+    PredictionError,
+    InvalidInputError,
+)
+from sentiment_analysis.utils import setup_logger
+
+logger = setup_logger(__name__)
+
+# API metadata
+API_VERSION = "1.0.0"
+API_TITLE = "Sentiment Analysis API"
+API_DESCRIPTION = """
+Production-ready sentiment analysis API using LSTM neural networks.
+
+## Features
+
+* **Predict** sentiment for single or batch texts
+* **Health check** endpoint for monitoring
+* **Model info** endpoint for model metadata
+* **CORS enabled** for cross-origin requests
+
+## Usage
+
+Send a POST request to `/predict` with text to analyze.
+"""
+
+# Create FastAPI app
+app = FastAPI(
+    title=API_TITLE,
+    description=API_DESCRIPTION,
+    version=API_VERSION,
+    docs_url="/docs",
+    redoc_url="/redoc",
+)
+
+# Add CORS middleware
+app.add_middleware(
+    CORSMiddleware,
+    allow_origins=["*"],  # In production, replace with specific origins
+    allow_credentials=True,
+    allow_methods=["*"],
+    allow_headers=["*"],
+)
+
+# Initialize predictor
+predictor = None
+
+
+# Request/Response models
+class PredictRequest(BaseModel):
+    """Request model for prediction."""
+
+    text: str = Field(..., min_length=1, max_length=10000, description="Text to analyze")
+
+    @validator("text")
+    def validate_text(cls, v):
+        if not v.strip():
+            raise ValueError("Text cannot be empty or only whitespace")
+        return v.strip()
+
+
+class BatchPredictRequest(BaseModel):
+    """Request model for batch prediction."""
+
+    texts: List[str] = Field(
+        ..., min_items=1, max_items=100, description="List of texts to analyze"
+    )
+
+    @validator("texts")
+    def validate_texts(cls, v):
+        cleaned = [text.strip() for text in v if text.strip()]
+        if not cleaned:
+            raise ValueError("At least one non-empty text is required")
+        return cleaned
+
+
+class PredictResponse(BaseModel):
+    """Response model for prediction."""
+
+    text: str = Field(..., description="Input text")
+    sentiment: str = Field(..., description="Predicted sentiment (Positive/Negative)")
+    score: float = Field(..., ge=0, le=1, description="Prediction score (0-1)")
+    confidence: float = Field(..., ge=0, le=1, description="Confidence level (0-1)")
+    timestamp: str = Field(..., description="Prediction timestamp")
+
+
+class BatchPredictResponse(BaseModel):
+    """Response model for batch prediction."""
+
+    predictions: List[PredictResponse]
+    count: int = Field(..., description="Number of predictions")
+    timestamp: str = Field(..., description="Batch prediction timestamp")
+
+
+class HealthResponse(BaseModel):
+    """Response model for health check."""
+
+    status: str = Field(..., description="Service status")
+    model_loaded: bool = Field(..., description="Whether model is loaded")
+    version: str = Field(..., description="API version")
+    timestamp: str = Field(..., description="Health check timestamp")
+
+
+class ModelInfoResponse(BaseModel):
+    """Response model for model information."""
+
+    vocab_size: int
+    max_length: int
+    embedding_dim: int
+    model_path: str
+    model_exists: bool
+
+
+# Startup event
+@app.on_event("startup")
+async def startup_event():
+    """Initialize predictor on startup."""
+    global predictor
+
+    try:
+        logger.info("Initializing predictor...")
+        model_path = os.getenv("MODEL_PATH", str(ModelConfig.MODEL_PATH))
+        predictor = Predictor(model_path=model_path)
+        logger.info("Predictor initialized successfully")
+    except Exception as e:
+        logger.error(f"Failed to initialize predictor: {e}")
+        # Continue without predictor - will return error on prediction requests
+
+
+# Root endpoint
+@app.get("/", tags=["General"])
+async def root():
+    """Root endpoint with API information."""
+    return {
+        "name": API_TITLE,
+        "version": API_VERSION,
+        "status": "running",
+        "docs": "/docs",
+        "health": "/health",
+    }
+
+
+# Health check endpoint
+@app.get("/health", response_model=HealthResponse, tags=["Monitoring"])
+async def health_check():
+    """
+    Health check endpoint for monitoring.
+
+    Returns service status and model availability.
+    """
+    model_loaded = predictor is not None and predictor.sentiment_model.model is not None
+
+    return HealthResponse(
+        status="healthy" if model_loaded else "degraded",
+        model_loaded=model_loaded,
+        version=API_VERSION,
+        timestamp=datetime.utcnow().isoformat(),
+    )
+
+
+# Model info endpoint
+@app.get("/model/info", response_model=ModelInfoResponse, tags=["Model"])
+async def get_model_info():
+    """
+    Get information about the loaded model.
+
+    Returns model configuration and status.
+    """
+    model_exists = Path(ModelConfig.MODEL_PATH).exists()
+
+    return ModelInfoResponse(
+        vocab_size=ModelConfig.VOCAB_SIZE,
+        max_length=ModelConfig.MAX_LENGTH,
+        embedding_dim=ModelConfig.EMBEDDING_DIM,
+        model_path=str(ModelConfig.MODEL_PATH),
+        model_exists=model_exists,
+    )
+
+
+# Prediction endpoint
+@app.post("/predict", response_model=PredictResponse, tags=["Prediction"])
+async def predict_sentiment(request: PredictRequest):
+    """
+    Predict sentiment for a single text.
+
+    - **text**: Text to analyze (required, 1-10000 characters)
+
+    Returns sentiment prediction with score and confidence.
+    """
+    if predictor is None:
+        raise HTTPException(
+            status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
+            detail="Predictor not initialized. Please check if model is available.",
+        )
+
+    try:
+        result = predictor.predict_text(request.text)
+        return PredictResponse(
+            text=result["text"],
+            sentiment=result["sentiment"],
+            score=result["score"],
+            confidence=result["confidence"],
+            timestamp=datetime.utcnow().isoformat(),
+        )
+    except Exception as e:
+        logger.error(f"Prediction error: {e}")
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"Prediction failed: {str(e)}",
+        )
+
+
+# Batch prediction endpoint
+@app.post("/predict/batch", response_model=BatchPredictResponse, tags=["Prediction"])
+async def predict_batch(request: BatchPredictRequest):
+    """
+    Predict sentiment for multiple texts.
+
+    - **texts**: List of texts to analyze (1-100 texts)
+
+    Returns batch predictions with metadata.
+    """
+    if predictor is None:
+        raise HTTPException(
+            status_code=status.HTTP_503_SERVICE_UNAVAILABLE,
+            detail="Predictor not initialized. Please check if model is available.",
+        )
+
+    try:
+        results = predictor.predict_batch(request.texts)
+
+        predictions = [
+            PredictResponse(
+                text=r["text"],
+                sentiment=r["sentiment"],
+                score=r["score"],
+                confidence=r["confidence"],
+                timestamp=datetime.utcnow().isoformat(),
+            )
+            for r in results
+        ]
+
+        return BatchPredictResponse(
+            predictions=predictions,
+            count=len(predictions),
+            timestamp=datetime.utcnow().isoformat(),
+        )
+    except Exception as e:
+        logger.error(f"Batch prediction error: {e}")
+        raise HTTPException(
+            status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+            detail=f"Batch prediction failed: {str(e)}",
+        )
+
+
+# Error handlers
+@app.exception_handler(ModelNotFoundError)
+async def model_not_found_handler(request, exc):
+    return JSONResponse(
+        status_code=status.HTTP_404_NOT_FOUND,
+        content={"detail": str(exc)},
+    )
+
+
+@app.exception_handler(PredictionError)
+async def prediction_error_handler(request, exc):
+    return JSONResponse(
+        status_code=status.HTTP_500_INTERNAL_SERVER_ERROR,
+        content={"detail": str(exc)},
+    )
+
+
+@app.exception_handler(InvalidInputError)
+async def invalid_input_handler(request, exc):
+    return JSONResponse(
+        status_code=status.HTTP_422_UNPROCESSABLE_ENTITY,
+        content={"detail": str(exc)},
+    )
+
+
+# Run with: uvicorn sentiment_analysis.api:app --reload
+if __name__ == "__main__":
+    import uvicorn
+
+    uvicorn.run(
+        "sentiment_analysis.api:app",
+        host=os.getenv("API_HOST", "0.0.0.0"),
+        port=int(os.getenv("API_PORT", 8000)),
+        reload=True,
+    )
diff --git a/src/sentiment_analysis/exceptions.py b/src/sentiment_analysis/exceptions.py
new file mode 100644
index 0000000..33de879
--- /dev/null
+++ b/src/sentiment_analysis/exceptions.py
@@ -0,0 +1,66 @@
+"""
+Custom exceptions for the sentiment analysis package.
+"""
+
+
+class SentimentAnalysisError(Exception):
+    """Base exception for all sentiment analysis errors."""
+
+    pass
+
+
+class ModelNotFoundError(SentimentAnalysisError):
+    """Raised when a model file is not found."""
+
+    def __init__(self, model_path):
+        self.model_path = model_path
+        super().__init__(f"Model not found at: {model_path}")
+
+
+class ModelNotTrainedError(SentimentAnalysisError):
+    """Raised when attempting to use an untrained model."""
+
+    def __init__(self, message="Model has not been trained yet"):
+        super().__init__(message)
+
+
+class DataLoadError(SentimentAnalysisError):
+    """Raised when data loading fails."""
+
+    pass
+
+
+class InvalidInputError(SentimentAnalysisError):
+    """Raised when input data is invalid."""
+
+    pass
+
+
+class ConfigurationError(SentimentAnalysisError):
+    """Raised when configuration is invalid."""
+
+    pass
+
+
+class PreprocessingError(SentimentAnalysisError):
+    """Raised when preprocessing fails."""
+
+    pass
+
+
+class TrainingError(SentimentAnalysisError):
+    """Raised when training fails."""
+
+    pass
+
+
+class PredictionError(SentimentAnalysisError):
+    """Raised when prediction fails."""
+
+    pass
+
+
+class ValidationError(SentimentAnalysisError):
+    """Raised when validation fails."""
+
+    pass