OpenRefine (formerly Google Refine) is a powerful tool for working with messy data: cleaning it; transforming it from one format into another; and extending it with web services and external data.
Please read the wiki to learn more.
# Docker Compose definition for a single OpenRefine service.
# Nesting is significant here: `openrefine` must sit under `services`, and the
# service's settings (image, ports, volumes, ...) must sit under `openrefine`.
version: "3.8"

services:
  openrefine:
    image: easypi/openrefine
    ports:
      # host:container. Kept quoted so the mapping is always read as a string.
      - "3333:3333"
    volumes:
      # Bind-mount the relative host path ./data at /data in the container;
      # REFINE_DATA_DIR below points at the same container path.
      - ./data:/data
    environment:
      # NOTE(review): the meaning of these variables is defined by the image /
      # OpenRefine start script, not by Compose — confirm against their docs.
      - REFINE_INTERFACE=0.0.0.0
      # Same port number as the container side of the port mapping above.
      - REFINE_PORT=3333
      # Both memory settings carry the same value.
      - REFINE_MIN_MEMORY=1024M
      - REFINE_MEMORY=1024M
      - REFINE_DATA_DIR=/data
      # Passed through verbatim; presumably consumed by the start script as an
      # extra name=value option — verify before changing the format.
      - REFINE_EXTRA_OPTS=refine.headless=true
    restart: unless-stopped