update readme
This commit is contained in:
parent
fb8c9bed6a
commit
993b2c7ca5
138
readme.md
138
readme.md
@ -1,128 +1,16 @@
|
|||||||
### Interaction Details
|
data munger
|
||||||
|
=================================================
|
||||||
|
|
||||||
* Maintain source definitions
|
organized storage and cleansing of disparate data
|
||||||
* List all sources
|
|
||||||
* change existing
|
|
||||||
* create new (with optional sample data to pre-populate)
|
|
||||||
* option to step into regex config
|
|
||||||
|
|
||||||
* Regex Instructions (Maint/Inquire)
|
current formats
|
||||||
* select source
|
--------------------------------------------------
|
||||||
* list all targets for that source
|
* csv
|
||||||
* either edit existing target or make a new one
|
* json
|
||||||
* target editing
|
|
||||||
* for each component of the instruction
|
|
||||||
* be able to run ad-hoc regex
|
|
||||||
* add additional components
|
|
||||||
|
|
||||||
* Cross Reference List (Maint/Inquire)
|
functions
|
||||||
|
-------------------------------------------------
|
||||||
* for a given regex target
|
* define constraints to prevent overlap during import
|
||||||
* list all output values (or only not yet mapped) and give opportunity to assign alternate value under a different key
|
* manipulate with regex
|
||||||
|
* tag data en masse
|
||||||
* Run Import
|
* flatten into traditional tables for downstream analytics
|
||||||
|
|
||||||
* insert new data
|
|
||||||
|
|
||||||
### source definition
|
|
||||||
```
|
|
||||||
srce | jsonb_pretty
|
|
||||||
------+---------------------------------------------------
|
|
||||||
hunt | { +
|
|
||||||
| "name": "hunt", +
|
|
||||||
| "source": "client_file", +
|
|
||||||
| "schemas": { +
|
|
||||||
| "default": [ +
|
|
||||||
| { +
|
|
||||||
| "path": "{Date}", +
|
|
||||||
| "type": "date", +
|
|
||||||
| "column_name": "Date" +
|
|
||||||
| }, +
|
|
||||||
| { +
|
|
||||||
| "path": "{Reference Number}", +
|
|
||||||
| "type": "numeric", +
|
|
||||||
| "column_name": "Reference Number"+
|
|
||||||
| }, +
|
|
||||||
| { +
|
|
||||||
| "path": "{Payee Name}", +
|
|
||||||
| "type": "text", +
|
|
||||||
| "column_name": "Payee Name" +
|
|
||||||
| }, +
|
|
||||||
| { +
|
|
||||||
| "path": "{Memo}", +
|
|
||||||
| "type": "text", +
|
|
||||||
| "column_name": "Memo" +
|
|
||||||
| }, +
|
|
||||||
| { +
|
|
||||||
| "path": "{Amount}", +
|
|
||||||
| "type": "numeric", +
|
|
||||||
| "column_name": "Amount" +
|
|
||||||
| }, +
|
|
||||||
| { +
|
|
||||||
| "path": "{Category Name}", +
|
|
||||||
| "type": "text", +
|
|
||||||
| "column_name": "Cateogry Name" +
|
|
||||||
| } +
|
|
||||||
| ] +
|
|
||||||
| }, +
|
|
||||||
| "constraint": [ +
|
|
||||||
| "{Date}" +
|
|
||||||
| ], +
|
|
||||||
| "loading_function": "csv" +
|
|
||||||
| }
|
|
||||||
```
|
|
||||||
|
|
||||||
### regex definitions
|
|
||||||
|
|
||||||
```
|
|
||||||
srce | target | regex | seq
|
|
||||||
-------+----------+--------------------------------------------------------------------------------+-----
|
|
||||||
dcard | First 20 | { +| 2
|
|
||||||
| | "name": "First 20", +|
|
|
||||||
| | "srce": "dcard", +|
|
|
||||||
| | "regex": { +|
|
|
||||||
| | "defn": [ +|
|
|
||||||
| | { +|
|
|
||||||
| | "key": "{Description}", +|
|
|
||||||
| | "map": "y", +|
|
|
||||||
| | "flag": "", +|
|
|
||||||
| | "field": "f20", +|
|
|
||||||
| | "regex": ".{1,20}", +|
|
|
||||||
| | "retain": "y" +|
|
|
||||||
| | } +|
|
|
||||||
| | ], +|
|
|
||||||
| | "name": "First 20", +|
|
|
||||||
| | "where": [ +|
|
|
||||||
| | { +|
|
|
||||||
| | } +|
|
|
||||||
| | ], +|
|
|
||||||
| | "function": "extract", +|
|
|
||||||
| | "description": "pull first 20 characters from description for mapping"+|
|
|
||||||
| | }, +|
|
|
||||||
| | "sequence": 2 +|
|
|
||||||
| | } |
|
|
||||||
hunt | First 20 | { +| 1
|
|
||||||
| | "name": "First 20", +|
|
|
||||||
| | "srce": "hunt", +|
|
|
||||||
| | "regex": { +|
|
|
||||||
| | "defn": [ +|
|
|
||||||
| | { +|
|
|
||||||
| | "key": "{Memo}", +|
|
|
||||||
| | "map": "y", +|
|
|
||||||
| | "flag": "", +|
|
|
||||||
| | "field": "f20", +|
|
|
||||||
| | "regex": ".{1,20}", +|
|
|
||||||
| | "retain": "y" +|
|
|
||||||
| | } +|
|
|
||||||
| | ], +|
|
|
||||||
| | "name": "First 20", +|
|
|
||||||
| | "where": [ +|
|
|
||||||
| | { +|
|
|
||||||
| | } +|
|
|
||||||
| | ], +|
|
|
||||||
| | "function": "extract", +|
|
|
||||||
| | "description": "pull first 20 characters from description for mapping"+|
|
|
||||||
| | }, +|
|
|
||||||
| | "sequence": 1 +|
|
|
||||||
| | } |
|
|
||||||
```
|
|
Loading…
Reference in New Issue
Block a user