Source code for ecoli.analysis.multivariant.dummy

from typing import Any

from duckdb import DuckDBPyConnection

OUTPUT_COLUMN_NAMES: set[str] = {
    "agent_id",
    "bulk",
    "experiment_id",
    "generation",
    "lineage_seed",
    "listeners__atp__atp_allocated_initial",
    "listeners__atp__atp_requested",
    "listeners__complexation_listener__complexation_events",
    "listeners__dna_supercoiling__segment_domain_indexes",
    "listeners__dna_supercoiling__segment_left_boundary_coordinates",
    "listeners__dna_supercoiling__segment_right_boundary_coordinates",
    "listeners__dna_supercoiling__segment_superhelical_densities",
    "listeners__enzyme_kinetics__actual_fluxes",
    "listeners__enzyme_kinetics__counts_to_molar",
    "listeners__enzyme_kinetics__enzyme_counts_init",
    "listeners__enzyme_kinetics__metabolite_counts_final",
    "listeners__enzyme_kinetics__metabolite_counts_init",
    "listeners__enzyme_kinetics__target_aa_conc",
    "listeners__enzyme_kinetics__target_fluxes",
    "listeners__enzyme_kinetics__target_fluxes_lower",
    "listeners__enzyme_kinetics__target_fluxes_upper",
    "listeners__equilibrium_listener__reaction_rates",
    "listeners__fba_results__base_reaction_fluxes",
    "listeners__fba_results__catalyst_counts",
    "listeners__fba_results__coefficient",
    "listeners__fba_results__conc_updates",
    "listeners__fba_results__constrained_molecules",
    "listeners__fba_results__delta_metabolites",
    "listeners__fba_results__external_exchange_fluxes",
    "listeners__fba_results__homeostatic_objective_values",
    "listeners__fba_results__kinetic_objective_values",
    "listeners__fba_results__media_id",
    "listeners__fba_results__objective_value",
    "listeners__fba_results__reaction_fluxes",
    "listeners__fba_results__reduced_costs",
    "listeners__fba_results__shadow_prices",
    "listeners__fba_results__target_concentrations",
    "listeners__fba_results__translation_gtp",
    "listeners__fba_results__unconstrained_molecules",
    "listeners__fba_results__uptake_constraints",
    "listeners__growth_limits__aa_allocated",
    "listeners__growth_limits__aa_conc",
    "listeners__growth_limits__aa_count_diff",
    "listeners__growth_limits__aa_export",
    "listeners__growth_limits__aa_exporters",
    "listeners__growth_limits__aa_import",
    "listeners__growth_limits__aa_importers",
    "listeners__growth_limits__aa_in_media",
    "listeners__growth_limits__aa_pool_size",
    "listeners__growth_limits__aa_request_size",
    "listeners__growth_limits__aa_supply",
    "listeners__growth_limits__aa_supply_aa_conc",
    "listeners__growth_limits__aa_supply_enzymes_fwd",
    "listeners__growth_limits__aa_supply_enzymes_rev",
    "listeners__growth_limits__aa_supply_fraction_fwd",
    "listeners__growth_limits__aa_supply_fraction_rev",
    "listeners__growth_limits__aa_synthesis",
    "listeners__growth_limits__aas_used",
    "listeners__growth_limits__active_ribosome_allocated",
    "listeners__growth_limits__charged_trna_conc",
    "listeners__growth_limits__fraction_aa_to_elongate",
    "listeners__growth_limits__fraction_trna_charged",
    "listeners__growth_limits__net_charged",
    "listeners__growth_limits__ntp_allocated",
    "listeners__growth_limits__ntp_pool_size",
    "listeners__growth_limits__ntp_request_size",
    "listeners__growth_limits__ntp_used",
    "listeners__growth_limits__original_aa_supply",
    "listeners__growth_limits__ppgpp_conc",
    "listeners__growth_limits__rela_conc",
    "listeners__growth_limits__rela_syn",
    "listeners__growth_limits__ribosome_conc",
    "listeners__growth_limits__spot_conc",
    "listeners__growth_limits__spot_deg",
    "listeners__growth_limits__spot_deg_inhibited",
    "listeners__growth_limits__spot_syn",
    "listeners__growth_limits__synthetase_conc",
    "listeners__growth_limits__trna_charged",
    "listeners__growth_limits__uncharged_trna_conc",
    "listeners__mass__cell_mass",
    "listeners__mass__cytosol_mass",
    "listeners__mass__dna_mass",
    "listeners__mass__dry_mass",
    "listeners__mass__dry_mass_fold_change",
    "listeners__mass__expected_mass_fold_change",
    "listeners__mass__extracellular_mass",
    "listeners__mass__flagellum_mass",
    "listeners__mass__growth",
    "listeners__mass__inner_membrane_mass",
    "listeners__mass__instantaneous_growth_rate",
    "listeners__mass__mRna_mass",
    "listeners__mass__membrane_mass",
    "listeners__mass__outer_membrane_mass",
    "listeners__mass__periplasm_mass",
    "listeners__mass__pilus_mass",
    "listeners__mass__projection_mass",
    "listeners__mass__protein_mass",
    "listeners__mass__protein_mass_fold_change",
    "listeners__mass__protein_mass_fraction",
    "listeners__mass__rRna_mass",
    "listeners__mass__rna_mass",
    "listeners__mass__rna_mass_fold_change",
    "listeners__mass__rna_mass_fraction",
    "listeners__mass__smallMolecule_mass",
    "listeners__mass__small_molecule_fold_change",
    "listeners__mass__tRna_mass",
    "listeners__mass__volume",
    "listeners__mass__water_mass",
    "listeners__monomer_counts",
    "listeners__replication_data__critical_initiation_mass",
    "listeners__replication_data__critical_mass_per_oriC",
    "listeners__replication_data__fork_coordinates",
    "listeners__replication_data__fork_domains",
    "listeners__replication_data__fork_unique_index",
    "listeners__replication_data__free_DnaA_boxes",
    "listeners__replication_data__number_of_oric",
    "listeners__replication_data__total_DnaA_boxes",
    "listeners__ribosome_data__aa_count_in_sequence",
    "listeners__ribosome_data__aa_counts",
    "listeners__ribosome_data__actual_elongation_hist",
    "listeners__ribosome_data__actual_elongations",
    "listeners__ribosome_data__actual_prob_translation_per_transcript",
    "listeners__ribosome_data__did_initialize",
    "listeners__ribosome_data__did_terminate",
    "listeners__ribosome_data__effective_elongation_rate",
    "listeners__ribosome_data__elongations_non_terminating_hist",
    "listeners__ribosome_data__mRNA_TU_index",
    "listeners__ribosome_data__mRNA_is_overcrowded",
    "listeners__ribosome_data__max_p",
    "listeners__ribosome_data__max_p_per_protein",
    "listeners__ribosome_data__n_ribosomes_on_each_mRNA",
    "listeners__ribosome_data__n_ribosomes_on_partial_mRNA_per_transcript",
    "listeners__ribosome_data__n_ribosomes_per_transcript",
    "listeners__ribosome_data__num_trpA_terminated",
    "listeners__ribosome_data__process_elongation_rate",
    "listeners__ribosome_data__protein_mass_on_polysomes",
    "listeners__ribosome_data__rRNA16S_init_prob",
    "listeners__ribosome_data__rRNA16S_initiated",
    "listeners__ribosome_data__rRNA23S_init_prob",
    "listeners__ribosome_data__rRNA23S_initiated",
    "listeners__ribosome_data__rRNA5S_init_prob",
    "listeners__ribosome_data__rRNA5S_initiated",
    "listeners__ribosome_data__rRNA_init_prob_TU",
    "listeners__ribosome_data__rRNA_initiated_TU",
    "listeners__ribosome_data__ribosome_init_event_per_monomer",
    "listeners__ribosome_data__target_prob_translation_per_transcript",
    "listeners__ribosome_data__termination_loss",
    "listeners__ribosome_data__total_rRNA_init_prob",
    "listeners__ribosome_data__total_rRNA_initiated",
    "listeners__ribosome_data__total_rna_init",
    "listeners__ribosome_data__translation_supply",
    "listeners__rna_counts__full_mRNA_cistron_counts",
    "listeners__rna_counts__full_mRNA_counts",
    "listeners__rna_counts__mRNA_cistron_counts",
    "listeners__rna_counts__mRNA_counts",
    "listeners__rna_counts__partial_mRNA_cistron_counts",
    "listeners__rna_counts__partial_mRNA_counts",
    "listeners__rna_counts__partial_rRNA_cistron_counts",
    "listeners__rna_counts__partial_rRNA_counts",
    "listeners__rna_degradation_listener__count_RNA_degraded_per_cistron",
    "listeners__rna_degradation_listener__count_rna_degraded",
    "listeners__rna_degradation_listener__diff_relative_first_order_decay",
    "listeners__rna_degradation_listener__fract_endo_rrna_counts",
    "listeners__rna_degradation_listener__fraction_active_endornases",
    "listeners__rna_degradation_listener__fragment_bases_digested",
    "listeners__rna_degradation_listener__nucleotides_from_degradation",
    "listeners__rna_maturation_listener__maturation_enzyme_counts",
    "listeners__rna_maturation_listener__mature_rnas_generated",
    "listeners__rna_maturation_listener__total_degraded_ntps",
    "listeners__rna_maturation_listener__total_maturation_events",
    "listeners__rna_maturation_listener__unprocessed_rnas_consumed",
    "listeners__rna_synth_prob__actual_rna_synth_prob",
    "listeners__rna_synth_prob__actual_rna_synth_prob_per_cistron",
    "listeners__rna_synth_prob__bound_TF_coordinates",
    "listeners__rna_synth_prob__bound_TF_domains",
    "listeners__rna_synth_prob__bound_TF_indexes",
    "listeners__rna_synth_prob__expected_rna_init_per_cistron",
    "listeners__rna_synth_prob__gene_copy_number",
    "listeners__rna_synth_prob__max_p",
    "listeners__rna_synth_prob__n_actual_bound",
    "listeners__rna_synth_prob__n_available_promoters",
    "listeners__rna_synth_prob__n_bound_TF_per_TU",
    "listeners__rna_synth_prob__n_bound_TF_per_cistron",
    "listeners__rna_synth_prob__n_promoter_bound",
    "listeners__rna_synth_prob__p_promoter_bound",
    "listeners__rna_synth_prob__promoter_copy_number",
    "listeners__rna_synth_prob__target_rna_synth_prob",
    "listeners__rna_synth_prob__target_rna_synth_prob_per_cistron",
    "listeners__rna_synth_prob__total_rna_init",
    "listeners__rna_synth_prob__tu_is_overcrowded",
    "listeners__rnap_data__active_rnap_coordinates",
    "listeners__rnap_data__active_rnap_domain_indexes",
    "listeners__rnap_data__active_rnap_n_bound_ribosomes",
    "listeners__rnap_data__active_rnap_on_stable_RNA_indexes",
    "listeners__rnap_data__active_rnap_unique_indexes",
    "listeners__rnap_data__actual_elongations",
    "listeners__rnap_data__codirectional_collision_coordinates",
    "listeners__rnap_data__did_initialize",
    "listeners__rnap_data__did_stall",
    "listeners__rnap_data__did_terminate",
    "listeners__rnap_data__empty_fork_collision_coordinates",
    "listeners__rnap_data__headon_collision_coordinates",
    "listeners__rnap_data__incomplete_transcription_events",
    "listeners__rnap_data__n_codirectional_collisions",
    "listeners__rnap_data__n_empty_fork_collisions",
    "listeners__rnap_data__n_headon_collisions",
    "listeners__rnap_data__n_removed_ribosomes",
    "listeners__rnap_data__n_total_collisions",
    "listeners__rnap_data__rna_init_event",
    "listeners__rnap_data__rna_init_event_per_cistron",
    "listeners__rnap_data__termination_loss",
    "listeners__transcript_elongation_listener__attenuation_probability",
    "listeners__transcript_elongation_listener__count_NTPs_used",
    "listeners__transcript_elongation_listener__count_rna_synthesized",
    "listeners__transcript_elongation_listener__counts_attenuated",
    "listeners__unique_molecule_counts__DnaA_box",
    "listeners__unique_molecule_counts__RNA",
    "listeners__unique_molecule_counts__active_RNAP",
    "listeners__unique_molecule_counts__active_replisome",
    "listeners__unique_molecule_counts__active_ribosome",
    "listeners__unique_molecule_counts__chromosomal_segment",
    "listeners__unique_molecule_counts__chromosome_domain",
    "listeners__unique_molecule_counts__full_chromosome",
    "listeners__unique_molecule_counts__gene",
    "listeners__unique_molecule_counts__oriC",
    "listeners__unique_molecule_counts__promoter",
    "process_state__polypeptide_elongation__aa_count_diff__ARG[c]",
    "process_state__polypeptide_elongation__aa_count_diff__ASN[c]",
    "process_state__polypeptide_elongation__aa_count_diff__CYS[c]",
    "process_state__polypeptide_elongation__aa_count_diff__GLN[c]",
    "process_state__polypeptide_elongation__aa_count_diff__GLT[c]",
    "process_state__polypeptide_elongation__aa_count_diff__GLY[c]",
    "process_state__polypeptide_elongation__aa_count_diff__HIS[c]",
    "process_state__polypeptide_elongation__aa_count_diff__ILE[c]",
    "process_state__polypeptide_elongation__aa_count_diff__L-ALPHA-ALANINE[c]",
    "process_state__polypeptide_elongation__aa_count_diff__L-ASPARTATE[c]",
    "process_state__polypeptide_elongation__aa_count_diff__L-SELENOCYSTEINE[c]",
    "process_state__polypeptide_elongation__aa_count_diff__LEU[c]",
    "process_state__polypeptide_elongation__aa_count_diff__LYS[c]",
    "process_state__polypeptide_elongation__aa_count_diff__MET[c]",
    "process_state__polypeptide_elongation__aa_count_diff__PHE[c]",
    "process_state__polypeptide_elongation__aa_count_diff__PRO[c]",
    "process_state__polypeptide_elongation__aa_count_diff__SER[c]",
    "process_state__polypeptide_elongation__aa_count_diff__THR[c]",
    "process_state__polypeptide_elongation__aa_count_diff__TRP[c]",
    "process_state__polypeptide_elongation__aa_count_diff__TYR[c]",
    "process_state__polypeptide_elongation__aa_count_diff__VAL[c]",
    "process_state__polypeptide_elongation__aa_exchange_rates",
    "process_state__polypeptide_elongation__gtp_to_hydrolyze",
    "time",
    "variant",
}


[docs] def plot( params: dict[str, Any], conn: DuckDBPyConnection, history_sql: str, config_sql: str, success_sql: str, sim_data_paths: dict[str, dict[int, str]], validation_data_paths: list[str], outdir: str, variant_metadata: dict[str, dict[int, Any]], variant_names: dict[str, str], ): """ Dummy analysis script that checks current output columns match expected list of output columns. """ current_column_names = conn.sql( f"SELECT column_name FROM (DESCRIBE ({history_sql})) ORDER BY column_name" ).pl() current_column_names = set(current_column_names["column_name"].to_list()) if current_column_names != OUTPUT_COLUMN_NAMES: missing_columns = OUTPUT_COLUMN_NAMES - current_column_names new_columns = current_column_names - OUTPUT_COLUMN_NAMES error_msg = [ "Output column names mismatch detected!\n", "This could be due to:\n", " 1. New output columns have been added to the simulation\n", " 2. Existing output columns have been renamed\n", " 3. Columns have been removed from the simulation\n", ] if new_columns: error_msg.append("\nNew columns (not in expected list):") error_msg.extend([f" • {col}" for col in sorted(new_columns)]) if missing_columns: error_msg.append("\nMissing columns (expected but not found):") error_msg.extend([f" • {col}" for col in sorted(missing_columns)]) error_msg.append("\nTroubleshooting:") error_msg.append( " • If new columns were added: Add them to OUTPUT_COLUMN_NAMES" ) error_msg.append( " • If columns were renamed: Update names in OUTPUT_COLUMN_NAMES" ) error_msg.append( " • If columns were removed: Remove names in OUTPUT_COLUMN_NAMES" ) error_msg.append( " • IMPORTANT: update other analyses that use renamed or removed columns" ) raise RuntimeError("\n".join(error_msg)) with open(f"{outdir}/dummy_analysis.txt", "w") as f: f.write("Dummy analysis completed successfully.\n") f.write("No issues detected with output column names.\n")