Exemplos de highlighted_text em Python, exemplos de Main.highlighted_text em Python

Exemplo n.º 1

0

Exibir arquivo

Arquivo: Age.py Projeto: JonathanReardon/ToolkitExtraction

student_age_df["part_age_8"]=student_age_df["part_age_raw"].map(set(['8']).issubset).astype(int)
student_age_df["part_age_9"]=student_age_df["part_age_raw"].map(set(['9']).issubset).astype(int)
student_age_df["part_age_10"]=student_age_df["part_age_raw"].map(set(['10']).issubset).astype(int)
student_age_df["part_age_11"]=student_age_df["part_age_raw"].map(set(['11']).issubset).astype(int)
student_age_df["part_age_12"]=student_age_df["part_age_raw"].map(set(['12']).issubset).astype(int)
student_age_df["part_age_13"]=student_age_df["part_age_raw"].map(set(['13']).issubset).astype(int)
student_age_df["part_age_14"]=student_age_df["part_age_raw"].map(set(['14']).issubset).astype(int)
student_age_df["part_age_15"]=student_age_df["part_age_raw"].map(set(['15']).issubset).astype(int)
student_age_df["part_age_16"]=student_age_df["part_age_raw"].map(set(['16']).issubset).astype(int)
student_age_df["part_age_17"]=student_age_df["part_age_raw"].map(set(['17']).issubset).astype(int)
student_age_df["part_age_18"]=student_age_df["part_age_raw"].map(set(['18']).issubset).astype(int)

student_age_df["part_age_no_information_provided"]=student_age_df["part_age_raw"].map(set(['No information provided']).issubset).astype(int) """

# Student age: result of highlighted_text(), transposed and labelled as the
# single column "part_age_ht".
student_age_HT = highlighted_text(student_age_output)
student_age_HT_df = pd.DataFrame(student_age_HT).T
student_age_HT_df.columns = ["part_age_ht"]

# Student age: result of comments(), transposed and labelled as the single
# column "part_age_info".
student_age_Comments = comments(student_age_output)
student_age_Comments_df = pd.DataFrame(student_age_Comments).T
student_age_Comments_df.columns = ["part_age_info"]

# Place the raw, highlighted-text and comment frames side by side (axis=1).
student_age = pd.concat(
    [student_age_df, student_age_HT_df, student_age_Comments_df],
    axis=1, sort=False)

Exemplo n.º 2

0

Exibir arquivo

Arquivo: InterventionDescription.py Projeto: JonathanReardon/ToolkitExtraction

from Main import load_json, comments, highlighted_text
from AttributeIDList import intervention_description_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Intervention description: highlighted text, transposed and labelled as the
# single column "int_desc_ht".
Intervention_DescriptionHT = highlighted_text(intervention_description_output)
Intervention_DescriptionHT_df = pd.DataFrame(Intervention_DescriptionHT).T
Intervention_DescriptionHT_df.columns = ["int_desc_ht"]

# Intervention description: user comments, transposed and labelled as the
# single column "int_desc_info".
Intervention_Description_Comments = comments(intervention_description_output)
Intervention_Description_Comments_df = pd.DataFrame(
    Intervention_Description_Comments).T
Intervention_Description_Comments_df.columns = ["int_desc_info"]

# Place both frames side by side (axis=1).
intervention_description_df = pd.concat(
    [Intervention_DescriptionHT_df, Intervention_Description_Comments_df],
    axis=1,
    sort=False)

# Remove problematic text: every carriage return, line feed, ':' and ';' is
# replaced by a space. One character class does this in a single pass over
# the frame instead of four separate regex passes.
intervention_description_df.replace(
    r'[\r\n:;]', ' ', regex=True, inplace=True)

Exemplo n.º 3

0

Exibir arquivo

Arquivo: SampleSize.py Projeto: JonathanReardon/ToolkitExtraction

from Main import load_json, comments, highlighted_text
from AttributeIDList import sample_size_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Sample size: user comments, transposed and labelled as the single column
# "sample_analysed_info".
sample_size_Comments = comments(sample_size_output)
sample_size_Comments_df = pd.DataFrame(sample_size_Comments).T
sample_size_Comments_df.columns = ["sample_analysed_info"]

# Sample size: highlighted text, transposed and labelled as the single column
# "sample_analysed_ht".
sample_size_HT = highlighted_text(sample_size_output)
sample_size_HT_df = pd.DataFrame(sample_size_HT).T
sample_size_HT_df.columns = ["sample_analysed_ht"]

# Place both frames side by side (axis=1).
sample_size_df = pd.concat([sample_size_Comments_df, sample_size_HT_df],
                           axis=1,
                           sort=False)

# Remove problematic text: carriage returns and line feeds become spaces.
# One character class handles both in a single pass over the frame.
sample_size_df.replace(r'[\r\n]', ' ', regex=True, inplace=True)

# Missing values are filled with the literal string "NA".
sample_size_df.fillna("NA", inplace=True)

Exemplo n.º 4

0

Exibir arquivo

Arquivo: LocationInformation.py Projeto: JonathanReardon/ToolkitExtraction

# load json file
load_json()
# NOTE: the triple-quoted string that follows is disabled code kept as a bare
# string expression; it has no effect when this script runs.
""" # Get More Location Information highlighted text
more_location_info_HT = highlighted_text(more_location_info)
more_location_info_HT_df = pd.DataFrame(more_location_info_HT)
more_location_info_HT_df = more_location_info_HT_df.T
more_location_info_HT_df.columns = ["More_Location_information_HT"]

# Get More Location Information comments
more_location_info_Comments = comments(more_location_info)
more_location_info_Comments_df = pd.DataFrame(more_location_info_Comments)
more_location_info_Comments_df = more_location_info_Comments_df.T
more_location_info_Comments_df.columns = ["More_Location_Information_comments"] """

# Location-specific information: highlighted text, transposed and labelled as
# the single column "loc_spec_ht".
location_specific_info_HT = highlighted_text(specific_to_location)
location_specific_info_HT_df = pd.DataFrame(location_specific_info_HT).T
location_specific_info_HT_df.columns = ["loc_spec_ht"]

# Location-specific information: user comments, transposed and labelled as
# the single column "loc_spec_info".
location_specific_info_Comments = comments(specific_to_location)
location_specific_info_Comments_df = pd.DataFrame(
    location_specific_info_Comments).T
location_specific_info_Comments_df.columns = ["loc_spec_info"]

# Type of location: highlighted text, transposed.
type_of_location_info_HT = highlighted_text(type_of_location)
type_of_location_info_HT_df = pd.DataFrame(type_of_location_info_HT).T

Exemplo n.º 5

0

Exibir arquivo

from Main import load_json, comments, highlighted_text
from AttributeIDList import sample_size_intervention_output
from AttributeIDList import sample_size_control_output
from AttributeIDList import sample_size_second_intervention_output
from AttributeIDList import sample_size_third_intervention_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# ------------------------------------------
# Initial sample size for intervention group
# ------------------------------------------

# Highlighted text, transposed and labelled as the single column
# "base_n_treat_ht".
sample_size_intervention_HT = highlighted_text(sample_size_intervention_output)
sample_size_intervention_HT_df = pd.DataFrame(sample_size_intervention_HT).T
sample_size_intervention_HT_df.columns = ["base_n_treat_ht"]

# User comments, transposed and labelled as the single column
# "base_n_treat_info".
sample_size_intervention_Comments = comments(sample_size_intervention_output)
sample_size_intervention_Comments_df = pd.DataFrame(
    sample_size_intervention_Comments).T
sample_size_intervention_Comments_df.columns = ["base_n_treat_info"]

############################################
# Initial sample size for the control group
############################################

Exemplo n.º 6

0

Exibir arquivo

from AttributeIDList import edu_setting_output
import pandas as pd

# Educational setting: main data from get_data(), transposed and labelled as
# the single column "int_setting_raw".
edusetting = get_data(edu_setting_output)
edusetting_df = pd.DataFrame(edusetting).T
edusetting_df.columns = ["int_setting_raw"]

# Binarisation of the raw column is currently disabled: the statements below
# sit inside a bare string expression and do not run.
""" edusetting_df["int_setting_primary/elementary_school"] = edusetting_df["int_setting_raw"].map(set(['Primary/elementary school']).issubset).astype(int)
edusetting_df["int_setting_middle_school"] = edusetting_df["int_setting_raw"].map(set(['Middle school']).issubset).astype(int)
edusetting_df["int_setting_secondary/high_school"] = edusetting_df["int_setting_raw"].map(set(['Secondary/High school']).issubset).astype(int) """

# Educational setting: highlighted text, single column "int_setting_ht".
edusetting_HT = highlighted_text(edu_setting_output)
edusetting_HT_df = pd.DataFrame(edusetting_HT).T
edusetting_HT_df.columns = ["int_setting_ht"]

# Educational setting: user comments, single column "int_setting_info".
edusetting_Comments = comments(edu_setting_output)
edusetting_Comments_df = pd.DataFrame(edusetting_Comments).T
edusetting_Comments_df.columns = ["int_setting_info"]

# concatenate data frames
educational_setting_df = pd.concat([
    edusetting_df, 
    edusetting_HT_df, 
    edusetting_Comments_df

Exemplo n.º 7

0

Exibir arquivo

Arquivo: InterventionDuration.py Projeto: JonathanReardon/ToolkitExtraction

from Main import load_json, comments, highlighted_text
from AttributeIDList import intervention_duration_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Intervention duration: highlighted text, transposed and labelled as the
# single column "int_dur_ht".
InterventionDuration_HT = highlighted_text(intervention_duration_output)
InterventionDuration_HT_df = pd.DataFrame(InterventionDuration_HT).T
InterventionDuration_HT_df.columns = ["int_dur_ht"]

# Intervention duration: user comments, transposed and labelled as the single
# column "int_dur_info".
InterventionDuration_Comments = comments(intervention_duration_output)
InterventionDuration_Comments_df = pd.DataFrame(
    InterventionDuration_Comments).T
InterventionDuration_Comments_df.columns = ["int_dur_info"]

# Place both frames side by side (axis=1).
intervention_duration_df = pd.concat(
    [InterventionDuration_HT_df, InterventionDuration_Comments_df],
    axis=1,
    sort=False)

# Remove problematic text from the text input: every carriage return, line
# feed, ':' and ';' becomes a space. One character class does this in a
# single pass over the frame instead of four separate regex passes.
intervention_duration_df.replace(
    r'[\r\n:;]', ' ', regex=True, inplace=True)

Exemplo n.º 8

0

Exibir arquivo

Arquivo: NumberofClasses.py Projeto: JonathanReardon/ToolkitExtraction

load_json()

# ---------------------------------
# Number of classes: intervention
# ---------------------------------

# User comments, transposed and labelled as the single column
# "class_treat_info".
number_of_classes_intervention_Comments = comments(
    number_of_classes_intervention_output)
number_of_classes_intervention_Comments_df = pd.DataFrame(
    number_of_classes_intervention_Comments).T
number_of_classes_intervention_Comments_df.columns = ["class_treat_info"]

# Highlighted text, transposed and labelled as the single column
# "class_treat_ht".
number_of_classes_intervention_HT = highlighted_text(
    number_of_classes_intervention_output)
number_of_classes_intervention_HT_df = pd.DataFrame(
    number_of_classes_intervention_HT).T
number_of_classes_intervention_HT_df.columns = ["class_treat_ht"]

# ----------------------------
# Number of classes: control
# ----------------------------

# User comments, transposed and labelled as the single column
# "class_cont_info".
number_of_classes_control_Comments = comments(number_of_classes_control_output)
number_of_classes_control_Comments_df = pd.DataFrame(
    number_of_classes_control_Comments).T
number_of_classes_control_Comments_df.columns = ["class_cont_info"]

Exemplo n.º 9

0

Exibir arquivo

Arquivo: Randomisation.py Projeto: JonathanReardon/ToolkitExtraction

from Main import load_json, get_data, comments, highlighted_text
from AttributeIDList import randomisation_details
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Randomisation: main data from get_data(), transposed and labelled as the
# single column "rand_raw".
randomisation = get_data(randomisation_details)
randomisation_df = pd.DataFrame(randomisation).T
randomisation_df.columns = ["rand_raw"]

# Randomisation: highlighted text, single column "rand_ht". Note that this
# frame is named randomisation_details_df, not *_HT_df.
randomisation_HT = highlighted_text(randomisation_details)
randomisation_details_df = pd.DataFrame(randomisation_HT).T
randomisation_details_df.columns = ["rand_ht"]

# Randomisation: user comments, single column "rand_info".
randomisation_Comments = comments(randomisation_details)
randomisation_Comments_df = pd.DataFrame(randomisation_Comments).T
randomisation_Comments_df.columns = ["rand_info"]

# Place the three frames side by side (axis=1); randomisation_df is rebound
# to the combined frame.
randomisation_df = pd.concat(
    [randomisation_df, randomisation_details_df, randomisation_Comments_df],
    axis=1, sort=False)

Exemplo n.º 10

0

Exibir arquivo

Arquivo: Clustering.py Projeto: JonathanReardon/ToolkitExtraction

from Main import get_data, highlighted_text, comments
from AttributeIDList import clustering_output
import pandas as pd

# Clustering: main data from get_data(), transposed and labelled as the
# single column "clust_anal_raw".
clustering = get_data(clustering_output)
clustering_df = pd.DataFrame(clustering).T
clustering_df.columns = ["clust_anal_raw"]

# Clustering: highlighted text, single column "clust_anal_ht".
clustering_HT = highlighted_text(clustering_output)
clustering_HT_df = pd.DataFrame(clustering_HT).T
clustering_HT_df.columns = ["clust_anal_ht"]

# Clustering: user comments, single column "clust_anal_info".
clustering_Comments = comments(clustering_output)
clustering_Comments_df = pd.DataFrame(clustering_Comments).T
clustering_Comments_df.columns = ["clust_anal_info"]

# Place the three frames side by side (axis=1); clustering_df is rebound to
# the combined frame.
clustering_df = pd.concat(
    [clustering_df, clustering_HT_df, clustering_Comments_df],
    axis=1, sort=False)

# Missing values are filled with the literal string "NA".
clustering_df.fillna("NA", inplace=True)

Exemplo n.º 11

0

Exibir arquivo

''' curriculumsubjects_df["test_subject_literacy_(first_language)"] = curriculumsubjects_df["test_subject_raw"].map(set(['Literacy (first language)']).issubset).astype(int)
curriculumsubjects_df["test_subject_reading_Comprehension"] = curriculumsubjects_df["test_subject_raw"].map(set(['Reading comprehension']).issubset).astype(int)
curriculumsubjects_df["test_subject_decoding/phonics"] = curriculumsubjects_df["test_subject_raw"].map(set(['Decoding/phonics']).issubset).astype(int)
curriculumsubjects_df["test_subject_spelling"] = curriculumsubjects_df["test_subject_raw"].map(set(['Spelling']).issubset).astype(int)
curriculumsubjects_df["test_subject_reading_other"] = curriculumsubjects_df["test_subject_raw"].map(set(['Reading other']).issubset).astype(int)
curriculumsubjects_df["test_subject_speaking_and_listening/oral_language"] = curriculumsubjects_df["test_subject_raw"].map(set(['Speaking and listening/Oral language']).issubset).astype(int)
curriculumsubjects_df["test_subject_writing"] = curriculumsubjects_df["test_subject_raw"].map(set(['Writing']).issubset).astype(int)
curriculumsubjects_df["test_subject_mathematics"] = curriculumsubjects_df["test_subject_raw"].map(set(['Mathematics']).issubset).astype(int)
curriculumsubjects_df["test_subject_science"] = curriculumsubjects_df["test_subject_raw"].map(set(['Science']).issubset).astype(int)
curriculumsubjects_df["test_subject_social_studies"] = curriculumsubjects_df["test_subject_raw"].map(set(['Social studies']).issubset).astype(int)
curriculumsubjects_df["test_subject_arts"] = curriculumsubjects_df["test_subject_raw"].map(set(['Arts']).issubset).astype(int)
curriculumsubjects_df["test_subject_languages"] = curriculumsubjects_df["test_subject_raw"].map(set(['Languages']).issubset).astype(int)
curriculumsubjects_df["test_subject_other_curriculum_test"] = curriculumsubjects_df["test_subject_raw"].map(set(['Other curriculum test']).issubset).astype(int) '''

# Curriculum subjects: highlighted text, transposed and labelled as the
# single column "test_subject_ht".
curriculumsubjects_HT = highlighted_text(curriculum_subjects)
curriculumsubjects_HT_df = pd.DataFrame(curriculumsubjects_HT).T
curriculumsubjects_HT_df.columns = ["test_subject_ht"]

# Curriculum subjects: user comments, transposed and labelled as the single
# column "test_subject_info".
curriculumsubjects_Comments = comments(curriculum_subjects)
curriculumsubjects_Comments_df = pd.DataFrame(curriculumsubjects_Comments).T
curriculumsubjects_Comments_df.columns = ["test_subject_info"]

###########################
# OTHER OUTCOMES REPORTED #
###########################

# get other outcomes data

Exemplo n.º 12

0

Exibir arquivo

Arquivo: Sample_Size_Analyzed.py Projeto: JonathanReardon/ToolkitExtraction

from Main import load_json, comments, highlighted_text
from AttributeIDList import sample_size_analyzed_intervention_output
from AttributeIDList import sample_size_analyzed_control_output
from AttributeIDList import sample_size_analyzed_second_intervention_output
from AttributeIDList import sample_size_analyzed_second_control_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# -------------------------------------------
# Analyzed sample size for intervention group
# -------------------------------------------

# Highlighted text, transposed and labelled as the single column
# "n_treat_ht". The un-suffixed name holds the highlighted_text() result.
sample_size_analyzed_intervention = highlighted_text(
    sample_size_analyzed_intervention_output)
sample_size_analyzed_intervention_df = pd.DataFrame(
    sample_size_analyzed_intervention).T
sample_size_analyzed_intervention_df.columns = ["n_treat_ht"]

# User comments, transposed and labelled as the single column
# "n_treat_info".
sample_size_analyzed_intervention_Comments = comments(
    sample_size_analyzed_intervention_output)
sample_size_analyzed_intervention_Comments_df = pd.DataFrame(
    sample_size_analyzed_intervention_Comments).T
sample_size_analyzed_intervention_Comments_df.columns = ["n_treat_info"]

############################################
# Analyzed sample size for the control group

Exemplo n.º 13

0

Exibir arquivo

Arquivo: InterventionTime.py Projeto: JonathanReardon/ToolkitExtraction

# load json file
load_json()

# -------------------
# INTERVENTION TIME
# -------------------

# Intervention time: main data from get_data(), transposed and labelled as
# the single column "int_when_raw".
InterventionTime = get_data(intervention_time_output)
InterventionTime_df = pd.DataFrame(InterventionTime).T
InterventionTime_df.columns = ["int_when_raw"]

# Intervention time: highlighted text, single column "int_when_ht".
InterventionTime_HT = highlighted_text(intervention_time_output)
InterventionTime_HT_df = pd.DataFrame(InterventionTime_HT).T
InterventionTime_HT_df.columns = ["int_when_ht"]

# Intervention time: user comments, single column "int_when_info".
InterventionTime_Comments = comments(intervention_time_output)
InterventionTime_Comments_df = pd.DataFrame(InterventionTime_Comments).T
InterventionTime_Comments_df.columns = ["int_when_info"]

# concatenate data frames
intervention_time_df = pd.concat([
    InterventionTime_df, InterventionTime_HT_df, InterventionTime_Comments_df
],
                                 axis=1,

Exemplo n.º 14

0

Exibir arquivo

from Main import load_json, get_data, comments, highlighted_text
from AttributeIDList import intervention_delivery_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Intervention delivery: main data from get_data(), transposed and labelled
# as the single column "int_who_raw".
InterventionDelivery = get_data(intervention_delivery_output)
interventiondelivery_df = pd.DataFrame(InterventionDelivery).T
interventiondelivery_df.columns = ["int_who_raw"]

# Intervention delivery: highlighted text, single column "int_who_ht".
InterventionDelivery_HT = highlighted_text(intervention_delivery_output)
InterventionDelivery_HT_df = pd.DataFrame(InterventionDelivery_HT).T
InterventionDelivery_HT_df.columns = ["int_who_ht"]

# Intervention delivery: user comments, single column "int_who_info".
InterventionDelivery_Comments = comments(intervention_delivery_output)
InterventionDelivery_Comments_df = pd.DataFrame(
    InterventionDelivery_Comments).T
InterventionDelivery_Comments_df.columns = ["int_who_info"]

# Place the three frames side by side (axis=1).
intervention_delivery_df = pd.concat(
    [interventiondelivery_df,
     InterventionDelivery_HT_df,
     InterventionDelivery_Comments_df],
    axis=1,
    sort=False)

Exemplo n.º 15

0

Exibir arquivo

Arquivo: InterventionName.py Projeto: JonathanReardon/ToolkitExtraction

from Main import load_json, comments, highlighted_text
from AttributeIDList import intervention_name_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Intervention name: highlighted text, transposed and labelled as the single
# column "int_name_ht".
Intervention_NameHT = highlighted_text(intervention_name_output)
Intervention_NameHT_df = pd.DataFrame(Intervention_NameHT).T
Intervention_NameHT_df.columns = ["int_name_ht"]

# Intervention name: user comments, transposed and labelled as the single
# column "int_name_info".
Intervention_Name_Comments = comments(intervention_name_output)
Intervention_Name_Comments_df = pd.DataFrame(Intervention_Name_Comments).T
Intervention_Name_Comments_df.columns = ["int_name_info"]

# Place both frames side by side (axis=1).
intervention_name_df = pd.concat(
    [Intervention_NameHT_df, Intervention_Name_Comments_df],
    axis=1,
    sort=False)

# Replace problematic text: every carriage return, line feed, ':' and ';'
# becomes a space. One character class does this in a single pass over the
# frame instead of four separate regex passes.
intervention_name_df.replace(r'[\r\n:;]', ' ', regex=True, inplace=True)

Exemplo n.º 16

0

Exibir arquivo

Arquivo: PrimaryOutcomeDescStatsControlGroup_TWO.py Projeto: JonathanReardon/ToolkitExtraction

from AttributeIDList import control_group_two_posttest_sd
from AttributeIDList import control_group_two_gain_score_mean
from AttributeIDList import control_group_two_gain_score_sd
from AttributeIDList import control_group_two_any_other_info
from AttributeIDList import follow_up_data_reported
import pandas as pd

# load json file
load_json()

# ----------------------------------
# Control group (two): group number
# ----------------------------------

# Highlighted text, transposed and labelled as the single column
# "n_cont2_ht".
ControlGroupNumber_HT = highlighted_text(control_group_two_number)
ControlGroupNumber_HT_df = pd.DataFrame(ControlGroupNumber_HT).T
ControlGroupNumber_HT_df.columns = ["n_cont2_ht"]

# User comments, transposed and labelled as the single column
# "n_cont2_info".
ControlGroupNumber_comments = comments(control_group_two_number)
ControlGroupNumber_comments_df = pd.DataFrame(ControlGroupNumber_comments).T
ControlGroupNumber_comments_df.columns = ["n_cont2_info"]

#################################
# Control GROUP PRE-TEST MEAN
#################################

# Get Control Group Pre-test Mean highlighted text

Exemplo n.º 17

0

Exibir arquivo

from Main import load_json, get_data, comments, highlighted_text
from AttributeIDList import intervention_costs_reported
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Intervention costs reported: main data from get_data(), transposed and
# labelled as the single column "int_cost_raw".
InterventionCosts = get_data(intervention_costs_reported)
InterventionCosts_df = pd.DataFrame(InterventionCosts).T
InterventionCosts_df.columns = ["int_cost_raw"]

# Intervention costs reported: highlighted text, single column "int_cost_ht".
InterventionCosts_HT = highlighted_text(intervention_costs_reported)
InterventionCosts_HT_df = pd.DataFrame(InterventionCosts_HT).T
InterventionCosts_HT_df.columns = ["int_cost_ht"]

# Intervention costs reported: user comments, single column "int_cost_info".
InterventionCosts_Comments = comments(intervention_costs_reported)
InterventionCosts_Comments_df = pd.DataFrame(InterventionCosts_Comments).T
InterventionCosts_Comments_df.columns = ["int_cost_info"]

# concatenate data frames
intervention_costs_df = pd.concat([
    InterventionCosts_df, InterventionCosts_HT_df,
    InterventionCosts_Comments_df
],
                                  axis=1,

Exemplo n.º 18

0

Exibir arquivo

from Main import load_json, get_data, comments, highlighted_text
from AttributeIDList import treatment_group
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Treatment group: main data from get_data(), transposed and labelled as the
# single column "treat_group_raw".
treatmentgroup = get_data(treatment_group)
treatmentgroup_df = pd.DataFrame(treatmentgroup).T
treatmentgroup_df.columns = ["treat_group_raw"]

# Treatment group: highlighted text, single column "treat_group_ht".
treatmentgroup_HT = highlighted_text(treatment_group)
treatmentgroup_HT_df = pd.DataFrame(treatmentgroup_HT).T
treatmentgroup_HT_df.columns = ["treat_group_ht"]

# Treatment group: user comments, single column "treat_group_info".
treatmentgroup_Comments = comments(treatment_group)
treatmentgroup_Comments_df = pd.DataFrame(treatmentgroup_Comments).T
treatmentgroup_Comments_df.columns = ["treat_group_info"]

# Place the three frames side by side (axis=1).
treatment_group_df = pd.concat(
    [treatmentgroup_df, treatmentgroup_HT_df, treatmentgroup_Comments_df],
    axis=1, sort=False)

Exemplo n.º 19

0

Exibir arquivo

Arquivo: PrimaryOutcomeDescStatsInterventionGroup.py Projeto: JonathanReardon/ToolkitExtraction

from AttributeIDList import intervention_group_posttest_mean
from AttributeIDList import intervention_group_posttest_sd
from AttributeIDList import intervention_group_gain_score_mean
from AttributeIDList import intervention_group_gain_score_sd
from AttributeIDList import intervention_group_any_other_info
import pandas as pd

# load json file
load_json()

# --------------------------
# Intervention group number
# --------------------------

# Highlighted text, transposed and labelled as the single column
# "n_treat_ht".
InterventionGroupNumber_HT = highlighted_text(intervention_group_number)
InterventionGroupNumber_HT_df = pd.DataFrame(InterventionGroupNumber_HT).T
InterventionGroupNumber_HT_df.columns = ["n_treat_ht"]

# User comments, transposed and labelled as the single column
# "n_treat_info".
InterventionGroupNumber_comments = comments(intervention_group_number)
InterventionGroupNumber_comments_df = pd.DataFrame(
    InterventionGroupNumber_comments).T
InterventionGroupNumber_comments_df.columns = ["n_treat_info"]

##################################
# INTERVENTION GROUP PRE-TEST MEAN
##################################

Exemplo n.º 20

0

Exibir arquivo

# load json file
load_json()

# -----------------------------------------
# Digital technology intervention inclusion
# -----------------------------------------

# Main data from get_data(), transposed and labelled as the single column
# "digit_tech_raw".
DigitalTechnology = get_data(intervention_approach_digital_technology)
DigitalTechnology_df = pd.DataFrame(DigitalTechnology).T
DigitalTechnology_df.columns = ["digit_tech_raw"]

# Highlighted text, single column "digit_tech_ht".
DigitalTechnology_HT = highlighted_text(
    intervention_approach_digital_technology)
DigitalTechnology_HT_df = pd.DataFrame(DigitalTechnology_HT).T
DigitalTechnology_HT_df.columns = ["digit_tech_ht"]

# User comments, single column "digit_tech_info".
DigitalTechnology_Comments = comments(intervention_approach_digital_technology)
DigitalTechnology_Comments_df = pd.DataFrame(DigitalTechnology_Comments).T
DigitalTechnology_Comments_df.columns = ["digit_tech_info"]

###########################################
# PARENTS OR COMMUNITY VOLUNTEERS INCLUSION
###########################################

# Get Parents/Community volunteers (inclusion) main data

Exemplo n.º 21

0

Exibir arquivo

from Main import load_json, get_data, comments, highlighted_text
from AttributeIDList import intervention_teaching_approach
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Intervention teaching approach: main data from get_data(), transposed and
# labelled as the single column "int_approach_raw".
InterventionTeachingApproach = get_data(intervention_teaching_approach)
InterventionTeachingApproach_df = pd.DataFrame(
    InterventionTeachingApproach).T
InterventionTeachingApproach_df.columns = ["int_approach_raw"]

# Intervention teaching approach: highlighted text, single column
# "int_approach_ht".
InterventionTeachingApproach_HT = highlighted_text(
    intervention_teaching_approach)
InterventionTeachingApproach_HT_df = pd.DataFrame(
    InterventionTeachingApproach_HT).T
InterventionTeachingApproach_HT_df.columns = ["int_approach_ht"]

# Intervention teaching approach: user comments, single column
# "int_approach_info".
InterventionTeachingApproach_Comments = comments(
    intervention_teaching_approach)
InterventionTeachingApproach_Comments_df = pd.DataFrame(
    InterventionTeachingApproach_Comments).T
InterventionTeachingApproach_Comments_df.columns = ["int_approach_info"]

# Place the three frames side by side (axis=1).
intervention_teaching_approach_df = pd.concat(
    [InterventionTeachingApproach_df,
     InterventionTeachingApproach_HT_df,
     InterventionTeachingApproach_Comments_df],
    axis=1,
    sort=False)

Exemplo n.º 22

0

Exibir arquivo

    "Syrian Arab Republic", "Congo, Dem. Rep", "Malawi", "Tajikistan",
    "Eritrea", "Mali", "Togo",
    "Ethiopia", "Mozambique", "Uganda",
    "Gambia, The", "Niger", "Yemen, Rep.", "Guinea", "Rwanda"
]

##############################################

# Country: main data from get_data(), transposed and labelled as the single
# column "loc_country_raw".
country = get_data(countries)
country_df = pd.DataFrame(country).T
country_df.columns = ["loc_country_raw"]

# Country: highlighted text, single column "loc_country_ht".
country_HT = highlighted_text(countries)
country_HT_df = pd.DataFrame(country_HT).T
country_HT_df.columns = ["loc_country_ht"]

# Country: user comments, single column "loc_country_info".
country_Comments = comments(countries)
country_Comments_df = pd.DataFrame(country_Comments).T
country_Comments_df.columns = ["loc_country_info"]

# The concatenation below is currently disabled: it sits inside a bare string
# expression and does not run, so country_df still holds only the raw column.
""" country_df = pd.concat(
    [country_df, country_HT_df, country_Comments_df], axis=1, sort=False) """

# fill blanks with NA

Exemplo n.º 23

0

Exibir arquivo

from Main import load_json, comments, highlighted_text
from AttributeIDList import intervention_frequency_output
import pandas as pd

# load json file (load_json is imported from Main)
load_json()

# Intervention frequency: highlighted text, transposed and labelled as the
# single column "int_freq_ht".
InterventionFrequency_HT = highlighted_text(intervention_frequency_output)
InterventionFrequency_HT_df = pd.DataFrame(InterventionFrequency_HT).T
InterventionFrequency_HT_df.columns = ["int_freq_ht"]

# Intervention frequency: user comments, transposed and labelled as the
# single column "int_freq_info".
InterventionFrequency_Comments = comments(intervention_frequency_output)
InterventionFrequency_Comments_df = pd.DataFrame(
    InterventionFrequency_Comments).T
InterventionFrequency_Comments_df.columns = ["int_freq_info"]

# Place both frames side by side (axis=1).
intervention_frequency_df = pd.concat(
    [InterventionFrequency_HT_df, InterventionFrequency_Comments_df],
    axis=1,
    sort=False)

# Remove problematic text from the text input: every carriage return, line
# feed, ':' and ';' becomes a space. One character class does this in a
# single pass over the frame instead of four separate regex passes.
intervention_frequency_df.replace(
    r'[\r\n:;]', ' ', regex=True, inplace=True)

Exemplo n.º 24

0

Exibir arquivo

Arquivo: Baseline_Differences.py Projeto: JonathanReardon/ToolkitExtraction

from Main import get_data, highlighted_text, comments
from AttributeIDList import baseline_differences_output
import pandas as pd

# Baseline differences main data: build the frame, transpose it, and name
# the resulting single column.
baselinedifferences = get_data(baseline_differences_output)
baselinedifferences_df = pd.DataFrame(baselinedifferences).T
baselinedifferences_df.columns = ["base_diff_raw"]

# Baseline differences highlighted text.
baselinedifferences_HT = highlighted_text(baseline_differences_output)
baselinedifferences_HT_df = pd.DataFrame(baselinedifferences_HT).T
baselinedifferences_HT_df.columns = ["base_diff_ht"]

# Baseline differences user comments.
baselinedifferences_Comments = comments(baseline_differences_output)
baselinedifferences_Comments_df = pd.DataFrame(baselinedifferences_Comments).T
baselinedifferences_Comments_df.columns = ["base_diff_info"]

# Combine raw data, highlighted text and comments column-wise.
baseline_differences_df = pd.concat(
    [
        baselinedifferences_df,
        baselinedifferences_HT_df,
        baselinedifferences_Comments_df,
    ],
    axis=1,
    sort=False,
)

# Missing cells become the literal string "NA" (in place).
baseline_differences_df.fillna(value="NA", inplace=True)

Exemplo n.º 25

0

Exibir arquivo

Arquivo: GenderSplit.py Projeto: JonathanReardon/ToolkitExtraction

from Main import highlighted_text, comments
from AttributeIDList import gender_split_output
import pandas as pd
 
# Gender split user comments (the result of comments()), transposed and
# stored under the column "Gender_Split_comments".
gender_split = comments(gender_split_output)
gender_split_df = pd.DataFrame(gender_split).T
gender_split_df.columns = ["Gender_Split_comments"]

# Gender split highlighted text. NOTE: despite the "_comments" variable
# names, these hold the result of highlighted_text().
gender_split_comments = highlighted_text(gender_split_output)
gender_split_comments_df = pd.DataFrame(gender_split_comments).T
gender_split_comments_df.columns = ["Gender_Split_HT"]

# Join both frames column-wise; gender_split_df is rebound to the result.
gender_split_df = pd.concat(
    [gender_split_df, gender_split_comments_df],
    axis=1,
    sort=False,
)

# Replace carriage returns and newlines with a space, in place.
gender_split_df.replace(to_replace='\r', value=' ', regex=True, inplace=True)
gender_split_df.replace(to_replace='\n', value=' ', regex=True, inplace=True)

# Missing cells become the literal string "NA" (in place).
gender_split_df.fillna(value="NA", inplace=True)

# Write the combined frame to CSV without the index column.
gender_split_df.to_csv("gender_split.csv", index=False)

Exemplo n.º 26

0

Exibir arquivo

Arquivo: PrimaryOutcomeDescStatsControlGroup.py Projeto: JonathanReardon/ToolkitExtraction

from AttributeIDList import control_group_posttest_sd
from AttributeIDList import control_group_gain_score_mean
from AttributeIDList import control_group_gain_score_sd
from AttributeIDList import control_group_any_other_info
from AttributeIDList import follow_up_data_reported
import pandas as pd

# Load the JSON file before querying any attributes.
load_json()

# ------------------------
# Control group number
# ------------------------

# Highlighted text for the control group number: build the frame,
# transpose it, and name the resulting single column.
ControlGroupNumber_HT = highlighted_text(control_group_number)
ControlGroupNumber_HT_df = pd.DataFrame(ControlGroupNumber_HT).T
ControlGroupNumber_HT_df.columns = ["n_cont_ht"]

# User comments for the control group number, shaped the same way.
ControlGroupNumber_comments = comments(control_group_number)
ControlGroupNumber_comments_df = pd.DataFrame(ControlGroupNumber_comments).T
ControlGroupNumber_comments_df.columns = ["n_cont_info"]

#################################
# Control GROUP PRE-TEST MEAN
#################################

# Get Control Group Pre-test Mean highlighted text

Exemplo n.º 27

0

Exibir arquivo

Arquivo: InterventionObjectives.py Projeto: JonathanReardon/ToolkitExtraction

from Main import load_json, comments, highlighted_text
from AttributeIDList import intervention_objectives_output
import pandas as pd

# Load the JSON file before querying any attributes.
load_json()

# Highlighted text for intervention objectives: build the frame,
# transpose it, and name the resulting single column.
Intervention_ObjectivesHT = highlighted_text(intervention_objectives_output)
Intervention_ObjectivesHT_df = pd.DataFrame(Intervention_ObjectivesHT).T
Intervention_ObjectivesHT_df.columns = ["int_objec_ht"]

# User comments for intervention objectives, shaped the same way.
Intervention_Objectives_Comments = comments(intervention_objectives_output)
Intervention_Objectives_Comments_df = pd.DataFrame(
    Intervention_Objectives_Comments).T
Intervention_Objectives_Comments_df.columns = ["int_objec_info"]

# Place highlighted text and comments side by side (column-wise).
intervention_objectives_df = pd.concat(
    [Intervention_ObjectivesHT_df, Intervention_Objectives_Comments_df],
    axis=1, sort=False,
)

# Replace carriage returns, newlines, colons and semicolons with a space,
# one pattern at a time, modifying the frame in place.
intervention_objectives_df.replace(
    to_replace='\r', value=' ', regex=True, inplace=True)
intervention_objectives_df.replace(
    to_replace='\n', value=' ', regex=True, inplace=True)
intervention_objectives_df.replace(
    to_replace=':', value=' ', regex=True, inplace=True)
intervention_objectives_df.replace(
    to_replace=';', value=' ', regex=True, inplace=True)

Exemplo n.º 28

0

Exibir arquivo

# Load the JSON file before querying any attributes.
load_json()

# ----------------
# Other outcomes
# ----------------

# Main data for other outcomes: build the frame, transpose it, and name
# the resulting single column.
other_outcomes = get_data(other_outcomes_output)
other_outcomes_df = pd.DataFrame(other_outcomes).T
other_outcomes_df.columns = ["out_other_raw"]

# Highlighted text for other outcomes.
other_outcomes_HT = highlighted_text(other_outcomes_output)
other_outcomes_HT_df = pd.DataFrame(other_outcomes_HT).T
other_outcomes_HT_df.columns = ["out_other_ht"]

# User comments for other outcomes.
other_outcomes_info = comments(other_outcomes_output)
other_outcomes_info_df = pd.DataFrame(other_outcomes_info).T
other_outcomes_info_df.columns = ["out_other_info"]

######################
# Additional outcomes
######################

# get additional outcomes data

Exemplo n.º 29

0

Exibir arquivo

from Main import load_json, get_data, comments, highlighted_text
from AttributeIDList import intervention_organisation_type_output
import pandas as pd

# Load the JSON file before querying any attributes.
load_json()

# Main data for intervention organisation type: build the frame,
# transpose it, and name the resulting single column.
InterventionOrgType = get_data(intervention_organisation_type_output)
InterventionOrgType_df = pd.DataFrame(InterventionOrgType).T
InterventionOrgType_df.columns = ["int_prov_raw"]

# Highlighted text for intervention organisation type.
InterventionOrgType_HT = highlighted_text(intervention_organisation_type_output)
InterventionOrgType_HT_df = pd.DataFrame(InterventionOrgType_HT).T
InterventionOrgType_HT_df.columns = ["int_prov_ht"]

# User comments for intervention organisation type.
InterventionOrgType_Comments = comments(intervention_organisation_type_output)
InterventionOrgType_Comments_df = pd.DataFrame(InterventionOrgType_Comments).T
InterventionOrgType_Comments_df.columns = ["int_prov_info"]

# concatenate data frames
intervention_org_type = pd.concat([
    InterventionOrgType_df, InterventionOrgType_HT_df,
    InterventionOrgType_Comments_df
],

Exemplo n.º 30

0

Exibir arquivo

# load_json is defined outside this excerpt; presumably it loads the
# project's JSON data before the lookups below -- confirm at its definition.
load_json()

# get intervention evaluation main data: one transposed frame with the
# single column "out_eval_raw"
InterventionEvaluation = get_data(intervention_evaluation)
InterventionEvaluation_df = pd.DataFrame(InterventionEvaluation)
InterventionEvaluation_df = InterventionEvaluation_df.T
InterventionEvaluation_df.columns = ["out_eval_raw"]

# Derive "eef_eval_raw": for each cell of "out_eval_raw", test whether the
# one-element set {"Is this an EEF evaluation?"} is a subset of the cell,
# i.e. whether the cell contains that exact string, and store it as 0/1.
# NOTE(review): presumably each cell is a list of selected option labels --
# confirm against get_data.
InterventionEvaluation_df["eef_eval_raw"] = InterventionEvaluation_df[
    "out_eval_raw"].map(set(["Is this an EEF evaluation?"
                             ]).issubset).astype(int)
# Translate the 0/1 flag into the labels "No"/"Yes".
InterventionEvaluation_df["eef_eval_raw"] = InterventionEvaluation_df[
    "eef_eval_raw"].replace(to_replace=[0, 1], value=["No", "Yes"])

# get intervention evaluation highlighted text
InterventionEvaluation_HT = highlighted_text(intervention_evaluation)
InterventionEvaluation_HT_df = pd.DataFrame(InterventionEvaluation_HT)
InterventionEvaluation_HT_df = InterventionEvaluation_HT_df.T
InterventionEvaluation_HT_df.columns = ["out_eval_ht"]

# get intervention evaluation user comments
InterventionEvaluation_Comments = comments(intervention_evaluation)
InterventionEvaluation_Comments_df = pd.DataFrame(
    InterventionEvaluation_Comments)
InterventionEvaluation_Comments_df = InterventionEvaluation_Comments_df.T
InterventionEvaluation_Comments_df.columns = ["out_eval_info"]

# concatenate data frames
intervention_evaluation_df = pd.concat([
    InterventionEvaluation_df, InterventionEvaluation_HT_df,
    InterventionEvaluation_Comments_df