Compare commits
No commits in common. "main" and "0.5.0" have entirely different histories.
316 changed files with 2721 additions and 10504 deletions
.gitignore
00-notebooks
02-data
intermediate
processed
extracted.csv
irrelevant
AlbujaEcheverria2021.DISABLEDClibborn2022.DISABLEDDumas2018.DISABLEDEckardt2022.yml.DISABLEDElveren2013.DISABLEDMhando2020.DISABLEDSaleh2018.DISABLEDdeGeus2022.DISABLED
relevant
Adam2018.ymlAdams2015.ymlAhumada2023.ymlAl-Mamun2014.ymlAlexiou2023.ymlAlinaghi2020.ymlBailey2012.ymlBartha2020.ymlBlumenberg2014.ymlBroadway2020.ymlCardinaleschi2019.ymlCarstens2018.ymlChao2022.ymlCieplinski2021.ymlClark2019.ymlCoutinho2006.ymlDavies2022.ymlDebowicz2014.ymlDelesalle2021.ymlDieckhoff2015.ymlDustmann2012.ymlEmigh2018.ymlFerguson2015.ymlField2019.ymlGates2000.ymlGilbert2001.ymlGo2010.ymlHardoy2015.ymlHojman2019.ymlKhan2021.ymlKuriyama2021.ymlLi2022.ymlLiyanaarachchi2016.ymlMilitaru2019.ymlMukhopadhaya2003.ymlMun2018.ymlPi2016.ymlPoppen2017.ymlRendall2013.ymlRosen2014.ymlShepherd-Banigan2021.ymlShin2006.ymlSilveiraNeto2011.ymlSotomayor2021.ymlStanding2015.ymlStock2021.ymlSuh2017.ymlThoresen2021.ymlWang2016.ymlWang2020.ymlWhitworth2021.ymlWong2019.ymlXu2021.yml
raw
01_wos-sample_2023-11-02
02_snowballing-starts
Bishu2017
Chamhuri2012
Chang2021
Crowther2001
Curran2022
Duflo2012
Finlay2021
Fortune2022
14
.gitignore
vendored
14
.gitignore
vendored
|
@ -1,14 +1,6 @@
|
|||
/documentation/DB
|
||||
/documentation/library
|
||||
/output
|
||||
/manuscript/*_files/
|
||||
|
||||
# Elsevier journal target:
|
||||
# Ignore bibliography style, spl (for natbib?) and latex class
|
||||
# since they don't get deleted after compilation
|
||||
*.spl
|
||||
*.bst
|
||||
*.cls
|
||||
/03-documentation/DB
|
||||
/03-documentation/library
|
||||
/04-outputs
|
||||
|
||||
# Created by https://www.toptal.com/developers/gitignore/api/-f,python,linux,vim,quarto,markdown,jupyternotebooks
|
||||
# Edit at https://www.toptal.com/developers/gitignore?templates=-f,python,linux,vim,quarto,markdown,jupyternotebooks
|
||||
|
|
|
@ -1,5 +1,5 @@
|
|||
---
|
||||
bibliography: ../data/intermediate/zotero-library.bib
|
||||
bibliography: ../02-data/intermediate/zotero-library.bib
|
||||
csl: /home/marty/documents/library/utilities/styles/APA-7.csl
|
||||
papersize: A4
|
||||
linestretch: 1.5
|
||||
|
@ -22,8 +22,7 @@ subtitle: Addressing inequalities in the World of Work
|
|||
```{python}
|
||||
#| echo: false
|
||||
from pathlib import Path
|
||||
import src.globals as g
|
||||
data_dir = g.DATA_DIR
|
||||
data_dir=Path("../02-data")
|
||||
|
||||
## standard imports
|
||||
from IPython.core.display import Markdown as md
|
||||
|
@ -44,9 +43,8 @@ sns.set_style("whitegrid")
|
|||
import bibtexparser
|
||||
|
||||
bib_string=""
|
||||
sample_dir = g.REFERENCE_DATA.joinpath("01_wos-sample_2023-11-02")
|
||||
print(f"path: {sample_dir.absolute()}")
|
||||
for partial_bib in sample_dir.glob("*.bib"):
|
||||
print(f"path: {data_dir.joinpath('raw/01_wos-sample_2023-11-02').absolute()}")
|
||||
for partial_bib in data_dir.joinpath("raw/01_wos-sample_2023-11-02").glob("*.bib"):
|
||||
with open(partial_bib) as f:
|
||||
bib_string+="\n".join(f.readlines())
|
||||
sample = bibtexparser.parse_string(bib_string)
|
|
@ -1,5 +1,5 @@
|
|||
---
|
||||
bibliography: data/intermediate/zotero-library.bib
|
||||
bibliography: 02-data/intermediate/zotero-library.bib
|
||||
title: Grab yml
|
||||
---
|
||||
|
||||
|
@ -184,18 +184,23 @@ from matplotlib import pyplot as plt
|
|||
import seaborn as sns
|
||||
from tabulate import tabulate
|
||||
import bibtexparser
|
||||
import src.globals as g
|
||||
|
||||
sns.set_style("whitegrid")
|
||||
|
||||
DATA_DIR=Path("./02-data")
|
||||
RAW_DATA=DATA_DIR.joinpath("raw")
|
||||
WORKING_DATA=DATA_DIR.joinpath("intermediate")
|
||||
PROCESSED_DATA=DATA_DIR.joinpath("processed")
|
||||
SUPPLEMENTARY_DATA=DATA_DIR.joinpath("supplementary")
|
||||
|
||||
bib_string=""
|
||||
for partial_bib in g.REFERENCE_DATA.glob("**/*.bib"):
|
||||
for partial_bib in RAW_DATA.glob("**/*.bib"):
|
||||
with open(partial_bib) as f:
|
||||
bib_string+="\n".join(f.readlines())
|
||||
bib_sample_raw_db = bibtexparser.parse_string(bib_string)
|
||||
|
||||
bib_string=""
|
||||
for partial_bib in g.REFERENCE_DATA.joinpath("zotero-library.bib"):
|
||||
for partial_bib in WORKING_DATA.glob("**/*.bib"):
|
||||
with open(partial_bib) as f:
|
||||
bib_string+="\n".join(f.readlines())
|
||||
bib_sample = bibtexparser.parse_string(bib_string)
|
||||
|
@ -217,10 +222,10 @@ zot_df = pd.DataFrame([
|
|||
], columns = ["doi", "cited", "usage", "keywords"]).drop_duplicates("doi").set_index("doi")
|
||||
|
||||
# Add WB country grouping definitions (income group, world region)
|
||||
WB_COUNTRY_GROUPS_FILE = Path(f"{g.SUPPLEMENTARY_DATA}/wb-country-groupings.xlsx").resolve()
|
||||
WB_COUNTRY_GROUPS_FILE = Path(f"{SUPPLEMENTARY_DATA}/wb-country-groupings.xlsx").resolve()
|
||||
df_country_groups = pd.read_excel(WB_COUNTRY_GROUPS_FILE).set_index("Economy")
|
||||
|
||||
bib_df = (load_data.from_yml(f"{g.PROCESSED_DATA}")
|
||||
bib_df = (load_data.from_yml(f"{PROCESSED_DATA}")
|
||||
.assign(
|
||||
doi=lambda _df: _df["uri"].str.extract(r"https?://(?:dx\.)?doi\.org/(.*)", expand=False),
|
||||
zot_cited=lambda _df: _df["doi"].map(zot_df["cited"]),
|
|
@ -15,7 +15,7 @@ import bibtexparser
|
|||
|
||||
sns.set_style("whitegrid")
|
||||
|
||||
DATA_DIR=Path("./data")
|
||||
DATA_DIR=Path("./02-data")
|
||||
RAW_DATA=DATA_DIR.joinpath("raw")
|
||||
WORKING_DATA=DATA_DIR.joinpath("intermediate")
|
||||
PROCESSED_DATA=DATA_DIR.joinpath("processed")
|
||||
|
@ -120,7 +120,7 @@ datavis:
|
|||
|
||||
|
||||
```{python}
|
||||
findings_institutional = pd.read_csv("data/supplementary/findings-institutional.csv")
|
||||
findings_institutional = pd.read_csv("02-data/supplementary/findings-institutional.csv")
|
||||
findings_institutional
|
||||
from src.model import validity
|
||||
import math
|
|
@ -16,7 +16,7 @@ import bibtexparser
|
|||
|
||||
sns.set_style("whitegrid")
|
||||
|
||||
DATA_DIR=Path("./data")
|
||||
DATA_DIR=Path("./02-data")
|
||||
RAW_DATA=DATA_DIR.joinpath("raw")
|
||||
WORKING_DATA=DATA_DIR.joinpath("intermediate")
|
||||
PROCESSED_DATA=DATA_DIR.joinpath("processed")
|
|
@ -1,5 +1,5 @@
|
|||
---
|
||||
bibliography: data/intermediate/zotero-library.bib
|
||||
bibliography: 02-data/intermediate/zotero-library.bib
|
||||
csl: /home/marty/documents/library/utilities/styles/APA-7.csl
|
||||
papersize: A4
|
||||
linestretch: 1.5
|
||||
|
@ -28,10 +28,8 @@ zotero:
|
|||
```{python}
|
||||
#| echo: false
|
||||
from pathlib import Path
|
||||
import src.globals as g
|
||||
DATA_DIR = g.DATA_DIR
|
||||
RAW_DATA = g.RAW_DATA
|
||||
BIB_PATH = g.REFERENCE_DATA.joinpath("01_wos-sample_2023-11-02")
|
||||
DATA_DIR=Path("./02-data")
|
||||
BIB_PATH = DATA_DIR.joinpath("raw/01_wos-sample_2023-11-02")
|
||||
|
||||
## standard imports
|
||||
from IPython.core.display import Markdown as md
|
File diff suppressed because one or more lines are too long
|
@ -15,7 +15,7 @@ group: working mothers
|
|||
data: national administrative Social Security Records (1975-2008)
|
||||
|
||||
design: quasi-experimental
|
||||
method: difference-in-difference analysis; regression discontinuity
|
||||
method: difference-in-difference analysis
|
||||
sample: 13000
|
||||
unit: individual
|
||||
representativeness: national, census
|
Some files were not shown because too many files have changed in this diff Show more
Loading…
Reference in a new issue