mirror of
https://github.com/zebrajr/imdbscrapper.git
synced 2026-01-15 12:15:12 +00:00
Changed: Folder Structure
This commit is contained in:
@@ -6,6 +6,6 @@ WORKDIR /opt/imdbscrapper
|
||||
COPY requirements.txt ./
|
||||
RUN pip install --no-cache-dir -r requirements.txt
|
||||
|
||||
COPY src/ .
|
||||
COPY src/scrapper/ .
|
||||
|
||||
CMD ["python", "-u", "/opt/imdbscrapper/scrapper.py"]
|
||||
|
||||
@@ -5,10 +5,34 @@ services:
|
||||
image: zebrajr/imdbscrapper:latest
|
||||
volumes:
|
||||
#- '${PWD}/src:/opt/imdbscrapper:ro'
|
||||
- '${PWD}/storage:/opt/storage'
|
||||
- './src/scrapper/:/opt/imdbscrapper'
|
||||
user: 1000:1000
|
||||
environment:
|
||||
- START_URL=1000
|
||||
- END_URL=0
|
||||
- START_URL=600000
|
||||
- END_URL=450000
|
||||
- STEPUPCYCLE=100
|
||||
- PROCESSES=5
|
||||
- PROCESSES=10
|
||||
depends_on:
|
||||
- imdbdb
|
||||
|
||||
|
||||
imdbdb:
|
||||
container_name: imdbdb
|
||||
image: mariadb:10.6
|
||||
restart: unless-stopped
|
||||
environment:
|
||||
MYSQL_ROOT_PASSWORD: secret
|
||||
volumes:
|
||||
- "./storage/back/:/var/lib/mysql"
|
||||
|
||||
|
||||
phpmyadmin:
|
||||
container_name: imdbphpmyadmin
|
||||
image: phpmyadmin/phpmyadmin:5.0.1
|
||||
restart: unless-stopped
|
||||
environment:
|
||||
PMA_HOST: imdbdb
|
||||
PMA_USER: root
|
||||
PMA_PASSWORD: secret
|
||||
ports:
|
||||
- "1239:80"
|
||||
|
||||
@@ -1,2 +1,3 @@
|
||||
beautifulsoup4
|
||||
requests
|
||||
mysql-connector
|
||||
|
||||
@@ -5,6 +5,7 @@ import json
|
||||
import requests
|
||||
import csv
|
||||
import logging
|
||||
import mysql.connector
|
||||
from multiprocessing import Process
|
||||
from bs4 import BeautifulSoup
|
||||
|
||||
Reference in New Issue
Block a user