# Global knitr chunk options; they apply to the chunks rendered after this call.
knitr::opts_chunk$set(
  # NOTE(review): the console output recorded further down in this file does
  # contain warnings and messages, and the original comments here said "show";
  # confirm whether FALSE or TRUE is the intended value for the next two options.
  warning = FALSE, # FALSE keeps warnings out of the rendered codebook
  message = FALSE, # FALSE keeps messages out of the rendered codebook
  error = TRUE, # do not interrupt codebook generation in case of errors,
                # usually better for debugging
  echo = TRUE  # show R code
)
# Make ggplot2's black-and-white theme the default for all subsequent plots.
ggplot2::theme_set(ggplot2::theme_bw())
# Directory that holds the yearly input files (read below as harmo_<year>.csv).
basedir <- "/home/ecco_rais/data/clean/RAIS-homogenized/output/"
# First and last year of the range to process; adjust as necessary.
startyear <- 2003
endyear <- 2004
# libraries
library(codebook)
library(rio)
## The following rio suggested packages are not installed: 'arrow', 'hexView', 'pzfx', 'rmatio', 'readODS', 'qs'
## Use 'install_formats()' to install them
# Start the codebook loop
# NOTE(review): the loop over startyear:endyear is currently commented out and
# a single hard-coded year is processed instead. "2009" lies outside the
# 2003-2004 range configured above -- confirm which year(s) are intended.
#for ( year in startyear:endyear) {
year <- "2009"

# for CSV
# fread() and as.data.table() belong to data.table, which none of the
# library() calls visible in this script attaches, so they are called through
# the namespace to avoid a "could not find function" error.
# NOTE(review): the "Couldn't find skimmers for class: integer64" warnings and
# the geom_histogram() errors recorded below presumably stem from large
# identifier columns being read as integer64; consider passing
# integer64 = "character" to fread() -- verify memory impact first.
codebook_data <- data.table::fread(
  file.path(basedir, paste0("harmo_", year, ".csv"))
)

# omit the following lines, if your missing values are already properly labelled
codebook_data <- detect_missing(
  codebook_data,
  only_labelled = TRUE, # only labelled values are autodetected as missing
  negative_values_are_missing = FALSE, # negative values are NOT treated as
                                       # missing values
  ninety_nine_problems = TRUE # 99/999 are missing values, if they
                              # are more than 5 MAD from the median
)

# If you are not using formr, the codebook package needs to guess which items
# form a scale. The following line finds item aggregates with names like this:
# scale = scale_1 + scale_2R + scale_3R
# identifying these aggregates allows the codebook function to
# automatically compute reliabilities.
# However, it will not reverse items automatically.
codebook_data <- detect_scales(codebook_data)
## Warning in detect_scales(codebook_data): cnae items found, but no aggregate
## Warning in detect_scales(codebook_data): active items found, but no aggregate
## Warning in detect_scales(codebook_data): cbo items found, but no aggregate

# Convert the result back to a data.table before rendering the codebook.
codebook_data <- data.table::as.data.table(codebook_data)
codebook(codebook_data)
## Warning in max(f): no non-missing arguments to max; returning -Inf
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning in max(f): no non-missing arguments to max; returning -Inf
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
## Warning: Couldn't find skimmers for class: integer64; No user-defined `sfl` provided. Falling
## back to `character`.
Dataset name: codebook_data
The dataset has N=61126896 rows and 47 columns. 25156272 rows have no missing values on any column.
  | 
#Variables
Distribution of values for adm_date
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| adm_date | numeric | 0 | 1 | 1e+06 | 4052009 | 3.1e+07 | 8246044 | 8387084 | ▇▂▂▂▁ | NA | 
Distribution of values for separation_cause
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| separation_cause | numeric | 0 | 1 | 0 | 0 | 80 | 4.913578 | 8.433527 | ▇▁▁▁▁ | NA | 
## Error in `ggplot2::geom_histogram()`:
## ! Problem while computing position.
## ℹ Error occurred in the 1st layer.
## Caused by error in `if (...) NULL`:
## ! missing value where TRUE/FALSE needed
0 missing values.
| name | data_type | n_missing | complete_rate | n_unique | empty | min | max | whitespace | label | 
|---|---|---|---|---|---|---|---|---|---|
| cei | character | 0 | 1 | 41349 | 0 | 1 | 21 | 0 | NA | 
Distribution of values for cnae20
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| cnae20 | numeric | 0 | 1 | 1113 | 47890 | 99008 | 54599.16 | 26784.19 | ▃▂▇▂▇ | NA | 
Distribution of values for cnae95
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| cnae95 | numeric | 0 | 1 | 1112 | 55131 | 99007 | 54757.21 | 23520.85 | ▃▂▇▇▂ | NA | 
## Error in `ggplot2::geom_histogram()`:
## ! Problem while computing position.
## ℹ Error occurred in the 1st layer.
## Caused by error in `if (...) NULL`:
## ! missing value where TRUE/FALSE needed
0 missing values.
| name | data_type | n_missing | complete_rate | n_unique | empty | min | max | whitespace | label | 
|---|---|---|---|---|---|---|---|---|---|
| cpf | character | 0 | 1 | 49917076 | 0 | 1 | 21 | 0 | NA | 
Distribution of values for dob
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| dob | numeric | 0 | 1 | 1e+06 | 1.5e+07 | 3.1e+07 | 15637746 | 8783222 | ▇▇▇▇▇ | NA | 
Distribution of values for active1231
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| active1231 | numeric | 0 | 1 | 0 | 1 | 1 | 0.6741312 | 0.4686986 | ▃▁▁▁▇ | NA | 
Distribution of values for sex
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| sex | numeric | 0 | 1 | 0 | 0 | 1 | 0.3968938 | 0.4892536 | ▇▁▁▁▅ | NA | 
Distribution of values for schooling
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| schooling | numeric | 0 | 1 | 1 | 7 | 11 | 6.221959 | 1.89172 | ▂▃▇▃▁ | NA | 
Distribution of values for hired_hours
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| hired_hours | numeric | 0 | 1 | 1 | 44 | 44 | 41.29789 | 6.309537 | ▁▁▁▁▇ | NA | 
## Error in `ggplot2::geom_histogram()`:
## ! Problem while computing stat.
## ℹ Error occurred in the 1st layer.
## Caused by error in `seq_len()`:
## ! argument must be coercible to non-negative integer
0 missing values.
| name | data_type | n_missing | complete_rate | n_unique | empty | min | max | whitespace | label | 
|---|---|---|---|---|---|---|---|---|---|
| firmID | character | 0 | 1 | 3185547 | 0 | 15 | 21 | 0 | NA | 
Distribution of values for alvara_ind
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| alvara_ind | numeric | 0 | 1 | 1 | 2 | 2 | 1.9997 | 0.0173099 | ▁▁▁▁▇ | NA | 
Distribution of values for cei_avail
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| cei_avail | numeric | 0 | 1 | 0 | 0 | 1 | 0.0202863 | 0.1409778 | ▇▁▁▁▁ | NA | 
Distribution of values for pat
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| pat | numeric | 0 | 1 | 0 | 0 | 1 | 0.2951455 | 0.4561082 | ▇▁▁▁▃ | NA | 
Distribution of values for simples
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| simples | numeric | 0 | 1 | 0 | 0 | 1 | 0.2155727 | 0.4112191 | ▇▁▁▁▂ | NA | 
Distribution of values for termination_month
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| termination_month | numeric | 0 | 1 | 0 | 0 | 12 | 2.168538 | 3.719281 | ▇▁▁▁▁ | NA | 
Distribution of values for muni
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| muni | numeric | 0 | 1 | 110001 | 351880 | 530010 | 345912.5 | 85144.28 | ▁▂▇▂▁ | NA | 
Distribution of values for nationality
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| nationality | numeric | 0 | 1 | 10 | 10 | 50 | 10.03189 | 0.9694217 | ▇▁▁▁▁ | NA | 
Distribution of values for legal_form
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| legal_form | numeric | 0 | 1 | -1 | 2062 | 5037 | 2045.251 | 678.1847 | ▁▂▇▁▁ | NA | 
Distribution of values for name
0 missing values.
| name | data_type | n_missing | complete_rate | n_unique | empty | min | max | whitespace | label | 
|---|---|---|---|---|---|---|---|---|---|
| name | character | 0 | 1 | 36140538 | 0 | 5 | 52 | 0 | NA | 
Distribution of values for ctps
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| ctps | numeric | 0 | 1 | 0 | 56585 | 1e+08 | 753905.6 | 3182637 | ▇▁▁▁▁ | NA | 
Distribution of values for cbo02
638901 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| cbo02 | numeric | 638901 | 0.989548 | 111215 | 514320 | 992225 | 521788.6 | 200032.8 | ▃▇▇▆▂ | NA | 
Distribution of values for cbo94
6550385 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| cbo94 | numeric | 6550385 | 0.8928396 | 12110 | 53260 | 99190 | 56355.81 | 26588.42 | ▃▇▅▂▆ | NA | 
## Error in `ggplot2::geom_histogram()`:
## ! Problem while computing stat.
## ℹ Error occurred in the 1st layer.
## Caused by error in `seq_len()`:
## ! argument must be coercible to non-negative integer
0 missing values.
| name | data_type | n_missing | complete_rate | n_unique | empty | min | max | whitespace | label | 
|---|---|---|---|---|---|---|---|---|---|
| pis | character | 0 | 1 | 50219948 | 0 | 13 | 21 | 0 | NA | 
Distribution of values for disabled
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| disabled | numeric | 0 | 1 | 0 | 1 | 1 | 0.9936983 | 0.0791328 | ▁▁▁▁▇ | NA | 
Distribution of values for race_color
9292848 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| race_color | numeric | 9292848 | 0.8479745 | 1 | 2 | 9 | 4.185512 | 2.862658 | ▇▁▁▁▅ | NA | 
Distribution of values for cnpj_root
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| cnpj_root | numeric | 0 | 1 | 0 | 9053646 | 1e+08 | 24801927 | 27972576 | ▇▁▂▁▁ | NA | 
Distribution of values for earn_dec
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| earn_dec | numeric | 0 | 1 | 0 | 628 | 69751 | 1085.789 | 2141.894 | ▇▁▁▁▁ | NA | 
Distribution of values for earn_dec_mw
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| earn_dec_mw | numeric | 0 | 1 | 0 | 1.4 | 150 | 2.331877 | 4.60537 | ▇▁▁▁▁ | NA | 
Distribution of values for mean_earn
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| mean_earn | numeric | 0 | 1 | 0 | 775 | 69750 | 1342.41 | 2065.947 | ▇▁▁▁▁ | NA | 
Distribution of values for mean_earn_mw
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| mean_earn_mw | numeric | 0 | 1 | 0 | 1.7 | 150 | 2.914609 | 4.512326 | ▇▁▁▁▁ | NA | 
Distribution of values for hired_wage
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| hired_wage | numeric | 0 | 1 | 0 | 620 | 1e+07 | 1009.998 | 12408.51 | ▇▁▁▁▁ | NA | 
Distribution of values for cnae20sub
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| cnae20sub | numeric | 0 | 1 | 111301 | 4789099 | 9900800 | 5459925 | 2678417 | ▃▂▇▂▇ | NA | 
Distribution of values for establishment_size
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| establishment_size | numeric | 0 | 1 | 0 | 6 | 9 | 5.387119 | 2.83178 | ▃▅▅▅▇ | NA | 
Distribution of values for tenure
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| tenure | numeric | 0 | 1 | 0 | 16 | 600 | 46.9931 | 73.93539 | ▇▁▁▁▁ | NA | 
Distribution of values for adm_type
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| adm_type | numeric | 0 | 1 | 0 | 0 | 8 | 0.7133586 | 1.017163 | ▇▃▁▁▁ | NA | 
Distribution of values for firmID_type
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| firmID_type | numeric | 0 | 1 | 0 | 1 | 1 | 0.9639371 | 0.1864468 | ▁▁▁▁▇ | NA | 
Distribution of values for wage_type
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| wage_type | numeric | 0 | 1 | 1 | 1 | 7 | 1.41541 | 1.245704 | ▇▁▁▁▁ | NA | 
Distribution of values for disability_type
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| disability_type | numeric | 0 | 1 | 0 | 0 | 6 | 0.0130432 | 0.2092178 | ▇▁▁▁▁ | NA | 
Distribution of values for contract_type
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| contract_type | numeric | 0 | 1 | 10 | 10 | 97 | 16.24178 | 13.4311 | ▇▂▁▁▁ | NA | 
Distribution of values for last_wage
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| last_wage | numeric | 0 | 1 | 0 | 1.7 | 150 | 3.218682 | 5.772439 | ▇▁▁▁▁ | NA | 
Distribution of values for yr
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| yr | numeric | 0 | 1 | 2009 | 2009 | 2009 | 2009 | 0 | ▁▁▇▁▁ | NA | 
Distribution of values for termination_year
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| termination_year | numeric | 0 | 1 | 2009 | 2009 | 2009 | 2009 | 0 | ▁▁▇▁▁ | NA | 
Distribution of values for adm_day
27223470 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| adm_day | numeric | 27223470 | 0.5546401 | 1 | 13 | 31 | 13.59446 | 7.786268 | ▇▇▇▅▂ | NA | 
Distribution of values for adm_month
4416667 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| adm_month | numeric | 4416667 | 0.9277459 | 1 | 6 | 12 | 6.043135 | 3.220171 | ▇▅▅▆▅ | NA | 
Distribution of values for adm_year
0 missing values.
| name | data_type | n_missing | complete_rate | min | median | max | mean | sd | hist | label | 
|---|---|---|---|---|---|---|---|---|---|---|
| adm_year | numeric | 0 | 1 | 1929 | 2008 | 2009 | 2005.445 | 6.093912 | ▁▁▁▁▇ | NA | 
The following JSON-LD can be found by search engines, if you share this codebook publicly on the web.
{
  "name": "codebook_data",
  "datePublished": "2024-06-01",
  "description": "The dataset has N=61126896 rows and 47 columns.\n25156272 rows have no missing values on any column.\n\n\n## Table of variables\nThis table contains variable names, labels, and number of missing values.\nSee the complete codebook for more.\n\n|name               |label | n_missing|\n|:------------------|:-----|---------:|\n|adm_date           |NA    |         0|\n|separation_cause   |NA    |         0|\n|cei                |NA    |         0|\n|cnae20             |NA    |         0|\n|cnae95             |NA    |         0|\n|cpf                |NA    |         0|\n|dob                |NA    |         0|\n|active1231         |NA    |         0|\n|sex                |NA    |         0|\n|schooling          |NA    |         0|\n|hired_hours        |NA    |         0|\n|firmID             |NA    |         0|\n|alvara_ind         |NA    |         0|\n|cei_avail          |NA    |         0|\n|pat                |NA    |         0|\n|simples            |NA    |         0|\n|termination_month  |NA    |         0|\n|muni               |NA    |         0|\n|nationality        |NA    |         0|\n|legal_form         |NA    |         0|\n|name               |NA    |         0|\n|ctps               |NA    |         0|\n|cbo02              |NA    |    638901|\n|cbo94              |NA    |   6550385|\n|pis                |NA    |         0|\n|disabled           |NA    |         0|\n|race_color         |NA    |   9292848|\n|cnpj_root          |NA    |         0|\n|earn_dec           |NA    |         0|\n|earn_dec_mw        |NA    |         0|\n|mean_earn          |NA    |         0|\n|mean_earn_mw       |NA    |         0|\n|hired_wage         |NA    |         0|\n|cnae20sub          |NA    |         0|\n|establishment_size |NA    |         0|\n|tenure             |NA    |         0|\n|adm_type           |NA    |         0|\n|firmID_type        |NA    |         0|\n|wage_type          |NA    |         0|\n|disability_type    |NA    |         0|\n|contract_type   
   |NA    |         0|\n|last_wage          |NA    |         0|\n|yr                 |NA    |         0|\n|termination_year   |NA    |         0|\n|adm_day            |NA    |  27223470|\n|adm_month          |NA    |   4416667|\n|adm_year           |NA    |         0|\n\n### Note\nThis dataset was automatically described using the [codebook R package](https://rubenarslan.github.io/codebook/) (version 0.9.2).",
  "keywords": ["adm_date", "separation_cause", "cei", "cnae20", "cnae95", "cpf", "dob", "active1231", "sex", "schooling", "hired_hours", "firmID", "alvara_ind", "cei_avail", "pat", "simples", "termination_month", "muni", "nationality", "legal_form", "name", "ctps", "cbo02", "cbo94", "pis", "disabled", "race_color", "cnpj_root", "earn_dec", "earn_dec_mw", "mean_earn", "mean_earn_mw", "hired_wage", "cnae20sub", "establishment_size", "tenure", "adm_type", "firmID_type", "wage_type", "disability_type", "contract_type", "last_wage", "yr", "termination_year", "adm_day", "adm_month", "adm_year"],
  "@context": "http://schema.org/",
  "@type": "Dataset",
  "variableMeasured": [
    {
      "name": "adm_date",
      "@type": "propertyValue"
    },
    {
      "name": "separation_cause",
      "@type": "propertyValue"
    },
    {
      "name": "cei",
      "@type": "propertyValue"
    },
    {
      "name": "cnae20",
      "@type": "propertyValue"
    },
    {
      "name": "cnae95",
      "@type": "propertyValue"
    },
    {
      "name": "cpf",
      "@type": "propertyValue"
    },
    {
      "name": "dob",
      "@type": "propertyValue"
    },
    {
      "name": "active1231",
      "@type": "propertyValue"
    },
    {
      "name": "sex",
      "@type": "propertyValue"
    },
    {
      "name": "schooling",
      "@type": "propertyValue"
    },
    {
      "name": "hired_hours",
      "@type": "propertyValue"
    },
    {
      "name": "firmID",
      "@type": "propertyValue"
    },
    {
      "name": "alvara_ind",
      "@type": "propertyValue"
    },
    {
      "name": "cei_avail",
      "@type": "propertyValue"
    },
    {
      "name": "pat",
      "@type": "propertyValue"
    },
    {
      "name": "simples",
      "@type": "propertyValue"
    },
    {
      "name": "termination_month",
      "@type": "propertyValue"
    },
    {
      "name": "muni",
      "@type": "propertyValue"
    },
    {
      "name": "nationality",
      "@type": "propertyValue"
    },
    {
      "name": "legal_form",
      "@type": "propertyValue"
    },
    {
      "name": "name",
      "@type": "propertyValue"
    },
    {
      "name": "ctps",
      "@type": "propertyValue"
    },
    {
      "name": "cbo02",
      "@type": "propertyValue"
    },
    {
      "name": "cbo94",
      "@type": "propertyValue"
    },
    {
      "name": "pis",
      "@type": "propertyValue"
    },
    {
      "name": "disabled",
      "@type": "propertyValue"
    },
    {
      "name": "race_color",
      "@type": "propertyValue"
    },
    {
      "name": "cnpj_root",
      "@type": "propertyValue"
    },
    {
      "name": "earn_dec",
      "@type": "propertyValue"
    },
    {
      "name": "earn_dec_mw",
      "@type": "propertyValue"
    },
    {
      "name": "mean_earn",
      "@type": "propertyValue"
    },
    {
      "name": "mean_earn_mw",
      "@type": "propertyValue"
    },
    {
      "name": "hired_wage",
      "@type": "propertyValue"
    },
    {
      "name": "cnae20sub",
      "@type": "propertyValue"
    },
    {
      "name": "establishment_size",
      "@type": "propertyValue"
    },
    {
      "name": "tenure",
      "@type": "propertyValue"
    },
    {
      "name": "adm_type",
      "@type": "propertyValue"
    },
    {
      "name": "firmID_type",
      "@type": "propertyValue"
    },
    {
      "name": "wage_type",
      "@type": "propertyValue"
    },
    {
      "name": "disability_type",
      "@type": "propertyValue"
    },
    {
      "name": "contract_type",
      "@type": "propertyValue"
    },
    {
      "name": "last_wage",
      "@type": "propertyValue"
    },
    {
      "name": "yr",
      "@type": "propertyValue"
    },
    {
      "name": "termination_year",
      "@type": "propertyValue"
    },
    {
      "name": "adm_day",
      "@type": "propertyValue"
    },
    {
      "name": "adm_month",
      "@type": "propertyValue"
    },
    {
      "name": "adm_year",
      "@type": "propertyValue"
    }
  ]
}
 # } # end year loop