4 Markers analyse

Code

#pkg
library(Seurat)
library(SoupX)
library(scDblFinder)
library(Matrix)
library(rtracklayer)
library(GenomeInfoDb)
library(tidyverse)
library(forcats)
library(ggplot2)
library(here)
library(tidyverse)
library(readxl)
library(gt)
library(paletteer)
library(scales)
library(DT)
library(htmlwidgets)
library(rtracklayer)
library(fs)
library(glmGamPoi)
library(furrr)
library(future)
library(googlesheets4)
library(DT)
library(janitor)
library(biomaRt)

library(readr)
library(stringr)
library(tidyr)
library(GenomicRanges)
library(GO.db)
library(AnnotationDbi)
library(patchwork) 

if (requireNamespace("glmGamPoi", quietly = TRUE)) message("glmGamPoi available: SCT will be faster.")
if (requireNamespace("presto", quietly = TRUE)) message("presto available: marker finding will be faster.")

# src
source(here::here("src/function/stat_function/stat_analysis_main.R")) # for make plot 
source(here::here("src/function/fig_export.R")) # This function saves a given plot (plot_x) as both a PDF and a high-resolution PNG file at specified dimensions.

runs_base <- "/mnt/ibioldata/LBMC_data/cmaslard/data/ScBdLR_init_2025_private/cellranger/"
#runs_base <- "/Volumes/IBIOLdata_storage/LBMC_data/cmaslard/data/ScBdLR_init_2025_private/cellranger/"

# ---- 0) Pick a GTF (prefer organelle ref, fallback to nuclear) ----
gtf_candidates <- c(
  here::here("data/refs/BdistachyonBd21_3_10X_Genome_organelle/genes/genes.gtf.gz"),
  here::here("data/refs/BdistachyonBd21_3_10X_Genome/genes/genes.gtf.gz")
)
gtf_file <- gtf_candidates[file.exists(gtf_candidates)][1]
message("Using GTF: ", gtf_file)
gtf <- rtracklayer::import(gtf_file)

obj_dir <- here("data/output/snrnaseq_objects")
obj_all <- readRDS(file.path(obj_dir, "obj_all_SCT_PCA_UMAP_clusters.rds"))

4.1 Find the top ones for some clusers

Code

DefaultAssay(obj_all) <- "SCT"
Idents(obj_all)       <- obj_all$seurat_clusters

# Prepare SCT models for marker testing (needed once per object)
obj_all <- PrepSCTFindMarkers(obj_all)

# Example: markers for clusters 6 and 2 against all other cells
markers_cl6 <- FindMarkers(
  obj_all,
  ident.1         = "6",
  assay           = "SCT",
  slot            = "data",
  logfc.threshold = 0.25,
  min.pct         = 0.1
)

markers_cl2 <- FindMarkers(
  obj_all,
  ident.1         = "2",
  assay           = "SCT",
  slot            = "data",
  logfc.threshold = 0.25,
  min.pct         = 0.1
)

markers_cl9 <- FindMarkers(
  obj_all,
  ident.1         = "9",
  assay           = "SCT",
  slot            = "data",
  logfc.threshold = 0.25,
  min.pct         = 0.1
)

markers_cl20 <- FindMarkers(
  obj_all,
  ident.1         = "20",
  assay           = "SCT",
  slot            = "data",
  logfc.threshold = 0.25,
  min.pct         = 0.1
)

markers_cl16 <- FindMarkers(
  obj_all,
  ident.1         = "16",
  assay           = "SCT",
  slot            = "data",
  logfc.threshold = 0.25,
  min.pct         = 0.1
)

# Inspect the top 20 markers for each cluster
head(markers_cl6[order(-markers_cl6$avg_log2FC), ], 20)
head(markers_cl2[order(-markers_cl2$avg_log2FC),  ], 20)
head(markers_cl9[order(-markers_cl9$avg_log2FC),  ], 20)
head(markers_cl20[order(-markers_cl20$avg_log2FC),  ], 20)

4.2 Importing Google Calc to verify certain candidates found in the literature

Code

sheet_url <- "https://docs.google.com/spreadsheets/d/1pL6r-ZwITYZoVLR7xS-OkTkGWVkothUbsY0klSni45c/edit?gid=399921653#gid=399921653"
gs4_deauth()
candidates <- read_sheet(
  ss = sheet_url,
  sheet = "Candidates"
) %>%
  janitor::clean_names()

# Display as an interactive, filterable table
datatable(
  candidates,
  filter = "top",        # column filters
  rownames = FALSE,
  extensions = c("Buttons"),
  options = list(
    pageLength = 25,
    autoWidth = TRUE,
    dom = "Bfrtip",
    buttons = c("copy", "csv", "excel")
  )
)

Code

write_csv(candidates, file = here::here("data/output/candidates/candidates.csv"), na = "")

4.3 Markers for certain clusters and tissues

Code

# ----------------------------
# Helpers
# ----------------------------

strip_version <- function(x) sub("\\.v[0-9.]+$", "", x)

safe_dir_create <- function(path) {
  dir.create(path, recursive = TRUE, showWarnings = FALSE)
  stopifnot(dir.exists(path))
  invisible(path)
}


anno_row_kv <- function(annotation_row) {
  if (is.null(annotation_row) || nrow(annotation_row) == 0) {
    return(tibble::tibble(field = character(), value = character()))
  }
  annotation_row <- dplyr::slice(annotation_row, 1)  # au cas où plusieurs lignes

  tibble::tibble(
    field = names(annotation_row),
    value = vapply(annotation_row, function(x) {
      # rend lisible même si c'est une liste / plusieurs valeurs
      if (is.list(x)) paste(unlist(x), collapse = "; ") else paste(x, collapse = "; ")
    }, FUN.VALUE = character(1))
  )
}

go_long_kv <- function(anno_go_long) {
  if (is.null(anno_go_long) || nrow(anno_go_long) == 0) {
    return(tibble::tibble(field = character(), value = character()))
  }

  tibble::tibble(field = names(anno_go_long)) |>
    dplyr::mutate(
      value = vapply(field, function(f) {
        x <- anno_go_long[[f]]
        x <- unique(as.character(x))
        x <- x[!is.na(x) & x != ""]
        paste(x, collapse = "; ")
      }, FUN.VALUE = character(1))
    )
}

get_jgi_annotation_for_gene <- function(gene_id, jgi_anno) {

  gene_id_clean <- strip_version(gene_id)

  jgi_anno2 <- jgi_anno %>%
    mutate(
      locus_clean      = strip_version(locusName),
      transcript_clean = strip_version(transcriptName)
    )

  anno_gene <- jgi_anno2 %>%
    filter(locus_clean == gene_id_clean | transcript_clean == gene_id_clean)

  # Extract ALL GO IDs robustly (regex)
  go_list <- stringr::str_extract_all(anno_gene$GO %||% "", "GO:\\d{7}")
  go_vec  <- unique(unlist(go_list))
  go_vec  <- go_vec[!is.na(go_vec) & go_vec != ""]

  # Long format
  anno_go_long <- tibble::tibble(
    locusName      = anno_gene$locusName,
    transcriptName = anno_gene$transcriptName,
    peptideName    = anno_gene$peptideName,
    go_id_list     = go_list
  ) %>%
    tidyr::unnest(go_id_list) %>%
    dplyr::rename(go_id = go_id_list) %>%
    dplyr::filter(!is.na(go_id), go_id != "") %>%
    dplyr::distinct()

  # Try GO.db annotations (TERM / ONTOLOGY / DEFINITION)
  go_annot <- NULL
  if (length(go_vec) > 0 &&
      requireNamespace("GO.db", quietly = TRUE) &&
      requireNamespace("AnnotationDbi", quietly = TRUE)) {

    go_annot <- tryCatch({
      res <- AnnotationDbi::select(
        GO.db::GO.db,
        keys     = go_vec,
        columns  = c("TERM", "ONTOLOGY", "DEFINITION"),
        keytype  = "GOID"
      )
      dplyr::rename(res, go_id = GOID)
    }, error = function(e) {
      # fallback without DEFINITION
      tryCatch({
        res <- AnnotationDbi::select(
          GO.db::GO.db,
          keys     = go_vec,
          columns  = c("TERM", "ONTOLOGY"),
          keytype  = "GOID"
        )
        dplyr::rename(res, go_id = GOID)
      }, error = function(e2) NULL)
    })

    if (!is.null(go_annot)) {
      anno_go_long <- anno_go_long %>%
        dplyr::left_join(go_annot, by = "go_id")
    }
  }

  list(
    anno_gene    = anno_gene,
    anno_go_long = anno_go_long,
    go_terms     = go_vec,
    go_annot     = go_annot
  )
}

`%||%` <- function(a, b) if (is.null(a)) b else a

get_gtf_features_for_gene <- function(gene_id, gtf) {
  info_gene <- gtf[gtf$gene_id == gene_id]

  if (length(info_gene) == 0) {
    stop("No GTF entries found for gene_id = ", gene_id)
  }

  gene_range <- range(info_gene)

  gene_all <- data.frame(
    gene_id        = info_gene$gene_id,
    gene_name      = info_gene$gene_name,
    transcript_id  = info_gene$transcript_id,
    type           = as.character(info_gene$type),
    source         = as.character(info_gene$source),
    score          = info_gene$score,
    phase          = info_gene$phase,
    seqname        = as.character(seqnames(info_gene)),
    start          = start(info_gene),
    end            = end(info_gene),
    strand         = as.character(strand(info_gene)),
    width          = width(info_gene),
    stringsAsFactors = FALSE
  ) %>%
    distinct() %>%
    arrange(transcript_id, type, start, end)

  by_type <- split(gene_all, gene_all$type)

  per_transcript <- gene_all %>%
    filter(!is.na(transcript_id)) %>%
    group_by(transcript_id, type) %>%
    summarise(
      n_features = n(),
      total_bp   = sum(width, na.rm = TRUE),
      .groups = "drop"
    ) %>%
    arrange(transcript_id, desc(total_bp))

  overview <- list(
    gene_id        = unique(gene_all$gene_id),
    gene_name      = unique(gene_all$gene_name),
    seqname        = unique(gene_all$seqname),
    strand         = unique(gene_all$strand),
    start          = start(gene_range),
    end            = end(gene_range),
    gene_length_bp = width(gene_range),
    n_transcripts  = length(unique(na.omit(gene_all$transcript_id))),
    feature_counts = sort(table(gene_all$type), decreasing = TRUE)
  )

  list(
    info_gene = info_gene,
    overview = overview,
    tables = list(
      all = gene_all,
      by_type = by_type,
      exons = if ("exon" %in% names(by_type)) by_type[["exon"]] else NULL,
      cds   = if ("CDS"  %in% names(by_type)) by_type[["CDS"]]  else NULL,
      transcripts = if ("transcript" %in% names(by_type)) by_type[["transcript"]] else NULL,
      per_transcript = per_transcript
    )
  )
}

get_candidates_info <- function(gene_id, df_candidates) {
  # tries multiple common column names; returns NULL if none match
  if (is.null(df_candidates) || nrow(df_candidates) == 0) return(NULL)

  gene_clean <- strip_version(gene_id)

  possible_cols <- c("gene_id", "gene", "geneid", "id", "locusName", "locus", "feature_id")
  present_cols <- intersect(possible_cols, names(df_candidates))
  if (length(present_cols) == 0) return(NULL)

  # try matching in any of these columns
  out <- NULL
  for (col in present_cols) {
    x <- df_candidates[[col]]
    x_clean <- strip_version(as.character(x))
    idx <- which(x_clean == gene_clean)
    if (length(idx) > 0) {
      out <- df_candidates[idx, , drop = FALSE]
      break
    }
  }
  out
}

# ----------------------------
# Main: build and save summary
# ----------------------------

build_and_save_gene_summary <- function(
  gene_id,
  gtf,
  jgi_anno_file,
  candidates_csv = NULL,
  out_base = here("report/snrnaseq/plot/marker")
) {
  # load JGI annotation
  jgi_anno <- read_tsv(jgi_anno_file, show_col_types = FALSE)

  # load candidates if provided
  df_candidates <- NULL
  if (!is.null(candidates_csv) && file.exists(candidates_csv)) {
    df_candidates <- read_csv(candidates_csv, show_col_types = FALSE)
  }

  # output directory
  path_gene <- safe_dir_create(file.path(out_base, gene_id))

  # GTF part
  gtf_res <- get_gtf_features_for_gene(gene_id, gtf)

  # JGI part (may be empty if not found)
  jgi_res <- get_jgi_annotation_for_gene(gene_id, jgi_anno)
  
  jgi_go_kv <- go_long_kv(jgi_res$anno_go_long)
  # candidates part (optional)
  cand_res <- get_candidates_info(gene_id, df_candidates)
  
  jgi_row_kv <- anno_row_kv(jgi_res$anno_gene)

  # assemble all-in-one object
gene_summary <- list(
  input = list(
    gene_id = gene_id,
    gene_id_clean = strip_version(gene_id),
    jgi_anno_file = jgi_anno_file,
    candidates_csv = candidates_csv,
    out_dir = path_gene
  ),
  overview = gtf_res$overview,

  # <--- THIS is what you want:
  tables = gtf_res$tables,

  jgi = list(
    annotation_row = jgi_row_kv,
    go_terms       = jgi_res$go_terms,
    go_long        = jgi_res$anno_go_long,  # tu peux garder la table longue
    go_kv          = jgi_go_kv,             # <- version “en colonne”
    go_annot       = jgi_res$go_annot
  ),
  candidates = cand_res
)

  # save RDS (main)
saveRDS(gene_summary, file.path(path_gene, "gene_summary.rds"))

  # helpful exports (optional but nice)
  write.csv(gtf_res$tables$all, file.path(path_gene, "gtf_all_features.csv"), row.names = FALSE)

  if (!is.null(jgi_res$anno_gene) && nrow(jgi_res$anno_gene) > 0) {
    write.csv(jgi_res$anno_gene, file.path(path_gene, "jgi_annotation.csv"), row.names = FALSE)
  }
  if (!is.null(jgi_res$anno_go_long) && nrow(jgi_res$anno_go_long) > 0) {
    write.csv(jgi_res$anno_go_long, file.path(path_gene, "jgi_go_terms_long.csv"), row.names = FALSE)
  }
  if (!is.null(cand_res) && nrow(cand_res) > 0) {
    write.csv(cand_res, file.path(path_gene, "candidates_row.csv"), row.names = FALSE)
  }

  return(gene_summary)
}

# ----------------------------
# Data
# ----------------------------
df_candidates<- read_csv(here::here("data/output/candidates/candidates.csv"))
path_output_marker<-here::here("report/snrnaseq/plot/marker")
DefaultAssay(obj_all) <- "SCT"
Idents(obj_all)       <- obj_all$seurat_clusters
# Prepare SCT models for marker testing (needed once per object)
obj_all <- PrepSCTFindMarkers(obj_all)

# ----------------------------
# Example usage
# ----------------------------

gene_id <- "BdiBd21-3.4G0260700.v1.2"  # example top marker for a pericycle-related cluster
gene_base2 <- "BdiBd21-3.5G0204500"
gene_id <- "BdiBd21-3.4G0260700.v1.2"
gene_id <- "BdiBd21-3.5G0204500.v1.2"
gene_id <- "BdiBd21-3.2G0308600.v1.2" # Best from 9 with GO
# LOAD GJI info 
# anno_file <- here::here("data/inputs_ref/JGI/BdistachyonBd21_3_537_v1.2.P14.annotation_info.txt.gz") 
# jgi_anno <- read_tsv(anno_file, show_col_types = FALSE)

# 
# gene_id_clean <- strip_version(gene_id)
# 
# jgi_anno2 <- jgi_anno %>%
#   mutate(
#     locus_clean      = strip_version(locusName),
#     transcript_clean = strip_version(transcriptName)
#   )

# Try matching by locusName first, otherwise transcriptName
# anno_gene <- jgi_anno2 %>%
#   filter(locus_clean == gene_id_clean | transcript_clean == gene_id_clean)



# function to create all plot but also function that regroup all info. 

export_gene_marker_plots_and_summary<-function(gene_id){
  print(gene_id)
path_gene <- file.path(path_output_marker, gene_id)

gene_summary <- build_and_save_gene_summary(
  gene_id = gene_id,
  gtf = gtf,
  jgi_anno_file = here("data/inputs_ref/JGI/BdistachyonBd21_3_537_v1.2.P14.annotation_info.txt.gz"),
  candidates_csv = here("data/output/candidates/candidates.csv"),
  out_base = here("report/snrnaseq/plot/marker")
)

# gene_summary$overview
# gene_summary$jgi$go_terms
# gene_summary$tables$all
# 
# gene_summary$jgi$go_annot
# gene_summary$jgi$annotation_row
# gene_summary$jgi$go_long


#### Cluster-wise average expression for the example gene ----
get_gene_cluster_means <- function(obj, gene_id,
                                   assay = "SCT",
                                   layer = "counts",
                                   ident_col = "seurat_clusters") {
  DefaultAssay(obj) <- assay
  Idents(obj)       <- obj[[ident_col]][, 1]

  mat <- GetAssayData(obj, assay = assay, layer = layer)

  if (!gene_id %in% rownames(mat)) {
    stop("Gene ", gene_id, " is not present in layer '", layer, "' of assay ", assay, ".")
  }

  expr_vec <- as.numeric(mat[gene_id, ])
  cl       <- as.factor(Idents(obj))

  mean_by_cl <- tapply(expr_vec, cl, mean, na.rm = TRUE)

  tibble(
    cluster   = names(mean_by_cl),
    mean_expr = as.numeric(mean_by_cl)
  )
}

p_mean <- get_gene_cluster_means(
  obj_all,
  gene_id = gene_id,
  assay   = "SCT",
  layer   = "counts"   # or "data" if you prefer SCT residuals
) %>% ggplot(., aes(x = cluster, y = mean_expr)) +
  geom_col() +
  theme_bw() +
  labs(
    x = "Cluster",
    y = paste("Mean", gene_id, "expression (", DefaultAssay(obj_all), "/", "counts", ")", sep = ""),
    title = paste("Average expression of", gene_id, "per cluster")
  )

fig_export(
  path    = paste0(path_gene,"/","mean_per_cluster"),
  plot_x  = p_mean,
  height_i = 4.5,
  width_i  = 6,
  res_i    = 300,
  format   = "png"
)

# Mean expression by cluster and timepoint (heatmap)
if ("timepoint" %in% colnames(obj_all@meta.data)) {
  DefaultAssay(obj_all) <- "SCT"

  mat_ct <- GetAssayData(obj_all, assay = "SCT", layer = "counts")
  stopifnot(gene_id %in% rownames(mat_ct))

  expr_vec_ct <- as.numeric(mat_ct[gene_id, ])
  meta_ct     <- obj_all@meta.data

  # Force timepoint order: 0, 4, 6, 8, 12 (with or without 'h')
  tp_vals <- as.character(meta_ct$timepoint)
  tp_vals <- gsub("\\s+", "", tp_vals)

  has_h <- any(grepl("h$", tp_vals, ignore.case = TRUE))
  desired_tp <- if (has_h) c("0h", "4h", "6h", "8h", "12h") else c("0", "4", "6", "8", "12")

  # keep only levels that exist
  desired_tp <- desired_tp[desired_tp %in% unique(tp_vals)]
  meta_ct$timepoint <- if (length(desired_tp) >= 2) factor(tp_vals, levels = desired_tp) else factor(tp_vals)

  df_ct <- tibble::tibble(
    cluster   = as.factor(meta_ct$seurat_clusters),
    timepoint = meta_ct$timepoint,
    expr      = expr_vec_ct
  ) |>
    dplyr::group_by(cluster, timepoint) |>
    dplyr::summarise(mean_expr = mean(expr, na.rm = TRUE), .groups = "drop")

  p_mean_ct <- ggplot(df_ct, aes(x = timepoint, y = cluster, fill = mean_expr)) +
    geom_tile() +
    scale_fill_gradient(low = "grey90", high = "purple") +
    theme_bw() +
    labs(
      x = "Timepoint",
      y = "Cluster",
      fill = "Mean expression",
      title = paste("Mean", gene_id, "expression by cluster and timepoint")
    )+ scale_y_discrete(limits = rev)

  fig_export(
    path    = paste0(path_gene, "/", "mean_cluster_timepoint"),
    plot_x  = p_mean_ct,
    height_i = 4,
    width_i  = 7,
    res_i    = 300,
    format   = "png"
  )
}

# Violin and UMAP views for the example marker ----
 # if you want to combine plots later

plot_gene_violin_umap <- function(
  obj,
  gene_id,
  assay       = "SCT",
  cluster_col = "seurat_clusters",
  tp_col      = "timepoint",
  reduction   = "umap",
  expr_layer  = "data",   # "data" or "counts"
  pt_size     = 0.1,
  tp_order    = c("0", "4", "6", "8", "12")  # desired order (without 'h')
) {
  # packages
  # Seurat, ggplot2, patchwork (for plot_layout/plot_annotation)

  # Assay & identities
  DefaultAssay(obj) <- assay
  if (!cluster_col %in% colnames(obj@meta.data)) {
    stop("Column '", cluster_col, "' not found in obj@meta.data.")
  }
  Idents(obj) <- as.factor(obj@meta.data[[cluster_col]])

  # Check gene existence in the requested layer
  mat <- tryCatch(
    GetAssayData(obj, assay = assay, layer = expr_layer),
    error = function(e) GetAssayData(obj, assay = assay, slot = expr_layer) # Seurat v4 fallback
  )
  if (!gene_id %in% rownames(mat)) {
    stop("Gene ", gene_id, " is not present in assay ", assay, " / layer ", expr_layer, ".")
  }

  ## 1) Violin plot by cluster
  p_violin <- tryCatch(
    VlnPlot(
      obj,
      features = gene_id,
      group.by = cluster_col,
      assay    = assay,
      layer    = expr_layer,
      pt.size  = pt_size
    ),
    error = function(e) {
      # Seurat v4 fallback
      VlnPlot(
        obj,
        features = gene_id,
        group.by = cluster_col,
        assay    = assay,
        slot     = expr_layer,
        pt.size  = pt_size
      )
    }
  ) +
    theme_bw() +
    theme(
      axis.text.x = element_text(angle = 45, hjust = 1),
      plot.title  = element_text(face = "bold")
    ) +
    labs(
      x = "Cluster",
      y = paste0(gene_id, " expression (", assay, "/", expr_layer, ")"),
      title = paste("Expression of", gene_id, "by cluster")
    )

  ## 2) UMAP feature plot (all timepoints combined)
  p_umap <- FeaturePlot(
    obj,
    features  = gene_id,
    reduction = reduction,
    order     = TRUE
  ) +
    theme_bw() +
    theme(
      axis.text  = element_blank(),
      axis.title = element_blank(),
      axis.ticks = element_blank(),
      plot.title = element_text(face = "bold")
    ) +
    labs(title = paste("UMAP -", gene_id))

  ## 3) Optional UMAP split by timepoint (ordered panels)
  p_umap_split <- NULL
  if (!is.null(tp_col) && tp_col %in% colnames(obj@meta.data)) {

    # Force timepoint order by setting factor levels
    tp_vals <- as.character(obj@meta.data[[tp_col]])
    tp_vals <- gsub("\\s+", "", tp_vals)

    # Detect whether your timepoints include 'h' suffix
    has_h <- any(grepl("h$", tp_vals, ignore.case = TRUE))

    if (has_h) {
      desired_levels <- paste0(tp_order, "h")
    } else {
      desired_levels <- tp_order
    }

    # Apply factor with desired order; keep only levels that exist in data
    desired_levels <- desired_levels[desired_levels %in% unique(tp_vals)]
    if (length(desired_levels) >= 2) {
      obj@meta.data[[tp_col]] <- factor(tp_vals, levels = desired_levels)
    } else {
      # fallback: keep existing order if we can't match
      obj@meta.data[[tp_col]] <- factor(tp_vals)
    }

    p_umap_split <- FeaturePlot(
      obj,
      features    = gene_id,
      reduction   = reduction,
      split.by    = tp_col,
      ncol        = min(4, length(levels(obj@meta.data[[tp_col]]))),
      order       = TRUE,
      keep.scale  = "all"
    ) &
      theme_bw() &
      theme(
        axis.text  = element_blank(),
        axis.title = element_blank(),
        axis.ticks = element_blank(),
        plot.title = element_text(face = "bold")
      )

    p_umap_split <- p_umap_split +
      patchwork::plot_layout(guides = "collect") +
      patchwork::plot_annotation(title = paste("UMAP split by", tp_col, "-", gene_id)) &
      theme(legend.position = "right")
  }

  list(
    violin     = p_violin,
    umap       = p_umap,
    umap_split = p_umap_split
  )
}

# execute ----
plots_gene <- plot_gene_violin_umap(
  obj         = obj_all,
  gene_id     = gene_id,
  assay       = "SCT",
  cluster_col = "seurat_clusters",
  tp_col      = "timepoint",
  reduction   = "umap"
)

# Export example marker plots
fig_export(
  path    = paste0(path_gene,"/","violin_SCT_cluster"),
  plot_x  = plots_gene$violin,
  height_i = 14,
  width_i  = 17,
  res_i    = 300,
  format   = "png"
)

fig_export(
  path    = paste0(path_gene,"/","umap"),
  plot_x  = plots_gene$umap,
  height_i = 14,
  width_i  = 16,
  res_i    = 300,
  format   = "png"
)

if (!is.null(plots_gene$umap_split)) {
  fig_export(
    path    = paste0(path_gene,"/","umap_split"),
    plot_x  = plots_gene$umap_split,
    height_i = 10,
    width_i  = 24,
    res_i    = 300,
    format   = "png"
  )
}
}

export_gene_marker_plots_and_summary("BdiBd21-3.1G0921900.v1.2")

gene_ids <- unique(paste0(candidates$brachypodium_gene_id, ".v1.2"))
gene_ids <-markers_cl20 %>%  tibble::rownames_to_column("gene") %>%  dplyr::arrange(dplyr::desc(avg_log2FC)) %>% dplyr::slice_head(n = 10) %>%   dplyr::pull(gene) # 10 first from cluster 20
gene_ids <-markers_cl16 %>%  tibble::rownames_to_column("gene") %>%  dplyr::arrange(dplyr::desc(avg_log2FC)) %>% dplyr::slice_head(n = 10) %>%   dplyr::pull(gene) # 10 first from cluster 16
to_remove <- c(
  "BdiBd21-3.1G0589500.v1.2"
  #"BdiBd21-3.2G0000000.v1.2"
)

gene_ids <- setdiff(gene_ids, to_remove)
# warning some are not in our genome

purrr::walk(gene_ids, export_gene_marker_plots_and_summary)

key	value
gene_id	BdiBd21-3.1G0383400.v1.2
gene_name	NA
seqname	Bd1
strand	-
start	24598520
end	24600112
gene_length_bp	1593
n_transcripts	1
feature_counts	exon: 3; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0383400.v1.2	NA	BdiBd21-3.1G0383400.1.v1.2	exon	phytozomev13	NA	NA	Bd1	24598520	24598852	-	333
BdiBd21-3.1G0383400.v1.2	NA	BdiBd21-3.1G0383400.1.v1.2	exon	phytozomev13	NA	NA	Bd1	24599472	24599566	-	95
BdiBd21-3.1G0383400.v1.2	NA	BdiBd21-3.1G0383400.1.v1.2	exon	phytozomev13	NA	NA	Bd1	24599688	24600112	-	425
BdiBd21-3.1G0383400.v1.2	NA	BdiBd21-3.1G0383400.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	24598520	24600112	-	1593

field	value
#pacId	PAC:42966526
locusName	BdiBd21-3.1G0383400
transcriptName	BdiBd21-3.1G0383400.1
peptideName	BdiBd21-3.1G0383400.1.p
Pfam	PF05922
Panther	PTHR48222:SF7
ec	NA
KOG	EC:3.4.21.62
KO	NA
GO	NA
Best-hit-arabi-name	AT1G71950
Best-hit-arabi-defline	(1 of 2) PTHR48222:SF4 - PROTEINASE INHIBITOR, PROPEPTIDE
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os07g25690
Best-hit-rice-defline	(1 of 1) PTHR48222:SF7 - OS07G0438600 PROTEIN
locus_clean	BdiBd21-3.1G0383400
transcript_clean	BdiBd21-3.1G0383400.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.1G0400200.v1.2
gene_name	NA
seqname	Bd1
strand	-
start	25760875
end	25763449
gene_length_bp	2575
n_transcripts	1
feature_counts	exon: 7; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	25760875	25761430	-	556
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	25761538	25761591	-	54
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	25761710	25761780	-	71
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	25762404	25762477	-	74
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	25762691	25762810	-	120
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	25762934	25763032	-	99
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	25763153	25763449	-	297
BdiBd21-3.1G0400200.v1.2	NA	BdiBd21-3.1G0400200.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	25760875	25763449	-	2575

field	value
#pacId	PAC:42968219
locusName	BdiBd21-3.1G0400200
transcriptName	BdiBd21-3.1G0400200.1
peptideName	BdiBd21-3.1G0400200.1.p
Pfam	PF00581
Panther	PTHR45431:SF3
ec	KOG1530
KOG	EC:2.8.1.1
KO	NA
GO	NA
Best-hit-arabi-name	AT4G35770
Best-hit-arabi-defline	(1 of 1) PTHR45431:SF3 - RHODANESE-LIKE DOMAIN-CONTAINING PROTEIN 15, CHLOROPLASTIC
Best-hit-clamy-name	Cre10.g444500
Best-hit-clamy-defline	(1 of 2) PTHR45431:SF3 - RHODANESE-LIKE DOMAIN-CONTAINING PROTEIN 15, CHLOROPLASTIC
Best-hit-rice-name	LOC_Os06g50930
Best-hit-rice-defline	(1 of 1) PTHR45431:SF3 - RHODANESE-LIKE DOMAIN-CONTAINING PROTEIN 15, CHLOROPLASTIC
locus_clean	BdiBd21-3.1G0400200
transcript_clean	BdiBd21-3.1G0400200.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.1G0514700.v1.2
gene_name	NA
seqname	Bd1
strand	+
start	34369737
end	34376836
gene_length_bp	7100
n_transcripts	1
feature_counts	exon: 7; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	34369737	34370105	+	369
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	34370200	34370350	+	151
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	34374364	34374560	+	197
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	34374698	34375162	+	465
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	34375259	34375679	+	421
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	34375787	34375914	+	128
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	34376014	34376836	+	823
BdiBd21-3.1G0514700.v1.2	NA	BdiBd21-3.1G0514700.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	34369737	34376836	+	7100

field	value
#pacId	PAC:42963861
locusName	BdiBd21-3.1G0514700
transcriptName	BdiBd21-3.1G0514700.1
peptideName	BdiBd21-3.1G0514700.1.p
Pfam	PF06963
Panther	PTHR11660:SF57
ec	KOG2601
KOG	NA
KO	K14685
GO	GO:0005381 GO:0016020 GO:0034755
Best-hit-arabi-name	AT5G03570
Best-hit-arabi-defline	(1 of 1) PTHR11660:SF57 - PROTEIN FPN-1.2
Best-hit-clamy-name	Cre16.g687000
Best-hit-clamy-defline	(1 of 1) K14685 - solute carrier family 40 (iron-regulated transporter), member 1 (SLC40A1, FPN1)
Best-hit-rice-name	LOC_Os06g36450
Best-hit-rice-defline	(1 of 1) K14685 - solute carrier family 40 (iron-regulated transporter), member 1 (SLC40A1, FPN1)
locus_clean	BdiBd21-3.1G0514700
transcript_clean	BdiBd21-3.1G0514700.1

field	value
locusName	BdiBd21-3.1G0514700
transcriptName	BdiBd21-3.1G0514700.1
peptideName	BdiBd21-3.1G0514700.1.p
go_id	GO:0005381; GO:0016020; GO:0034755
TERM	iron ion transmembrane transporter activity; membrane; iron ion transmembrane transport
ONTOLOGY	MF; CC; BP
DEFINITION	Enables the transfer of iron (Fe) ions from one side of a membrane to the other.; A lipid bilayer along with all the proteins and protein complexes embedded in it and attached to it.; A process in which an iron ion is transported from one side of a membrane to the other by means of some agent such as a transporter or pore.

key	value
gene_id	BdiBd21-3.1G0559800.v1.2
gene_name	NA
seqname	Bd1
strand	+
start	41106823
end	41109413
gene_length_bp	2591
n_transcripts	1
feature_counts	exon: 4; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0559800.v1.2	NA	BdiBd21-3.1G0559800.1.v1.2	exon	phytozomev13	NA	NA	Bd1	41106823	41107314	+	492
BdiBd21-3.1G0559800.v1.2	NA	BdiBd21-3.1G0559800.1.v1.2	exon	phytozomev13	NA	NA	Bd1	41107378	41107666	+	289
BdiBd21-3.1G0559800.v1.2	NA	BdiBd21-3.1G0559800.1.v1.2	exon	phytozomev13	NA	NA	Bd1	41108405	41108474	+	70
BdiBd21-3.1G0559800.v1.2	NA	BdiBd21-3.1G0559800.1.v1.2	exon	phytozomev13	NA	NA	Bd1	41108634	41109413	+	780
BdiBd21-3.1G0559800.v1.2	NA	BdiBd21-3.1G0559800.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	41106823	41109413	+	2591

field	value
#pacId	PAC:42961410
locusName	BdiBd21-3.1G0559800
transcriptName	BdiBd21-3.1G0559800.1
peptideName	BdiBd21-3.1G0559800.1.p
Pfam	PF13561
Panther	PTHR43899:SF42
ec	KOG1014
KOG	EC:1.1.1.330
KO	K10251
GO	NA
Best-hit-arabi-name	AT1G67730
Best-hit-arabi-defline	(1 of 1) K10251 - 17beta-estradiol 17-dehydrogenase / very-long-chain 3-oxoacyl-CoA reductase (HSD17B12, KAR, IFA38)
Best-hit-clamy-name	Cre09.g392430
Best-hit-clamy-defline	(1 of 1) 1.1.1.62 - 17beta-estradiol 17-dehydrogenase. / estrogen 17-oxidoreductase.
Best-hit-rice-name	LOC_Os06g19590
Best-hit-rice-defline	(1 of 1) PTHR43899:SF42 - OS06G0300000 PROTEIN
locus_clean	BdiBd21-3.1G0559800
transcript_clean	BdiBd21-3.1G0559800.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.1G0589500.v1.2
gene_name	NA
seqname	Bd1
strand	-
start	43692787
end	43693596
gene_length_bp	810
n_transcripts	1
feature_counts	exon: 3; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0589500.v1.2	NA	BdiBd21-3.1G0589500.1.v1.2	exon	phytozomev13	NA	NA	Bd1	43692787	43693002	-	216
BdiBd21-3.1G0589500.v1.2	NA	BdiBd21-3.1G0589500.1.v1.2	exon	phytozomev13	NA	NA	Bd1	43693161	43693284	-	124
BdiBd21-3.1G0589500.v1.2	NA	BdiBd21-3.1G0589500.1.v1.2	exon	phytozomev13	NA	NA	Bd1	43693382	43693596	-	215
BdiBd21-3.1G0589500.v1.2	NA	BdiBd21-3.1G0589500.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	43692787	43693596	-	810

field	value
#pacId	PAC:42962035
locusName	BdiBd21-3.1G0589500
transcriptName	BdiBd21-3.1G0589500.1
peptideName	BdiBd21-3.1G0589500.1.p
Pfam	PF04535
Panther	PTHR36488:SF8
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT5G15290
Best-hit-arabi-defline	(1 of 13) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os06g12500
Best-hit-rice-defline	(1 of 11) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
locus_clean	BdiBd21-3.1G0589500
transcript_clean	BdiBd21-3.1G0589500.1

table vide/incorrecte

umap.png absent

umap_split.png absent

mean_per_cluster_path.png absent

violin_SCT_cluster_path.png absent

mean_cluster_timepoint_path.png absent

key	value
gene_id	BdiBd21-3.1G0830100.v1.2
gene_name	NA
seqname	Bd1
strand	+
start	61328740
end	61333674
gene_length_bp	4935
n_transcripts	1
feature_counts	exon: 2; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0830100.v1.2	NA	BdiBd21-3.1G0830100.1.v1.2	exon	phytozomev13	NA	NA	Bd1	61328740	61329778	+	1039
BdiBd21-3.1G0830100.v1.2	NA	BdiBd21-3.1G0830100.1.v1.2	exon	phytozomev13	NA	NA	Bd1	61332494	61333674	+	1181
BdiBd21-3.1G0830100.v1.2	NA	BdiBd21-3.1G0830100.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	61328740	61333674	+	4935

field	value
#pacId	PAC:42965332
locusName	BdiBd21-3.1G0830100
transcriptName	BdiBd21-3.1G0830100.1
peptideName	BdiBd21-3.1G0830100.1.p
Pfam	PF00324
Panther	PTHR45826:SF22
ec	KOG1287
KOG	NA
KO	NA
GO	GO:0016020 GO:0055085
Best-hit-arabi-name	AT3G13620
Best-hit-arabi-defline	(1 of 1) PTHR45826:SF8 - AA_PERMEASE DOMAIN-CONTAINING PROTEIN
Best-hit-clamy-name	Cre06.g292350
Best-hit-clamy-defline	(1 of 1) PTHR45826:SF2 - ACID PERMEASE FAMILY PROTEIN, PUTATIVE, EXPRESSED-RELATED
Best-hit-rice-name	LOC_Os03g25920
Best-hit-rice-defline	(1 of 1) PTHR45826:SF18 - AA_PERMEASE DOMAIN-CONTAINING PROTEIN
locus_clean	BdiBd21-3.1G0830100
transcript_clean	BdiBd21-3.1G0830100.1

field	value
locusName	BdiBd21-3.1G0830100
transcriptName	BdiBd21-3.1G0830100.1
peptideName	BdiBd21-3.1G0830100.1.p
go_id	GO:0016020; GO:0055085
TERM	membrane; transmembrane transport
ONTOLOGY	CC; BP
DEFINITION	A lipid bilayer along with all the proteins and protein complexes embedded in it and attached to it.; The process in which a solute is transported across a lipid bilayer, from one side of a membrane to the other.

key	value
gene_id	BdiBd21-3.1G0868200.v1.2
gene_name	NA
seqname	Bd1
strand	+
start	64191338
end	64193150
gene_length_bp	1813
n_transcripts	1
feature_counts	exon: 5; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0868200.v1.2	NA	BdiBd21-3.1G0868200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64191338	64191824	+	487
BdiBd21-3.1G0868200.v1.2	NA	BdiBd21-3.1G0868200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64191926	64192088	+	163
BdiBd21-3.1G0868200.v1.2	NA	BdiBd21-3.1G0868200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64192187	64192393	+	207
BdiBd21-3.1G0868200.v1.2	NA	BdiBd21-3.1G0868200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64192487	64192734	+	248
BdiBd21-3.1G0868200.v1.2	NA	BdiBd21-3.1G0868200.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64192824	64193150	+	327
BdiBd21-3.1G0868200.v1.2	NA	BdiBd21-3.1G0868200.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	64191338	64193150	+	1813

field	value
#pacId	PAC:42958763
locusName	BdiBd21-3.1G0868200
transcriptName	BdiBd21-3.1G0868200.1
peptideName	BdiBd21-3.1G0868200.1.p
Pfam	PF01095
Panther	PTHR31321:SF98
ec	NA
KOG	EC:3.1.1.11
KO	NA
GO	GO:0030599 GO:0042545
Best-hit-arabi-name	AT3G17060
Best-hit-arabi-defline	(1 of 1) PTHR31321:SF98 - PECTINESTERASE 67-RELATED
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os03g19610
Best-hit-rice-defline	(1 of 1) PTHR31321:SF98 - PECTINESTERASE 67-RELATED
locus_clean	BdiBd21-3.1G0868200
transcript_clean	BdiBd21-3.1G0868200.1

field	value
locusName	BdiBd21-3.1G0868200
transcriptName	BdiBd21-3.1G0868200.1
peptideName	BdiBd21-3.1G0868200.1.p
go_id	GO:0030599; GO:0042545
TERM	pectinesterase activity; cell wall modification
ONTOLOGY	MF; BP
DEFINITION	Catalysis of the reaction: pectin + n H2O = n methanol + pectate.; The series of events leading to chemical and structural alterations of an existing cell wall that can result in loosening, increased extensibility or disassembly.

key	value
gene_id	BdiBd21-3.1G0877600.v1.2
gene_name	NA
seqname	Bd1
strand	-
start	64847468
end	64850473
gene_length_bp	3006
n_transcripts	1
feature_counts	exon: 4; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0877600.v1.2	NA	BdiBd21-3.1G0877600.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64847468	64848848	-	1381
BdiBd21-3.1G0877600.v1.2	NA	BdiBd21-3.1G0877600.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64849390	64849518	-	129
BdiBd21-3.1G0877600.v1.2	NA	BdiBd21-3.1G0877600.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64849626	64850022	-	397
BdiBd21-3.1G0877600.v1.2	NA	BdiBd21-3.1G0877600.1.v1.2	exon	phytozomev13	NA	NA	Bd1	64850141	64850473	-	333
BdiBd21-3.1G0877600.v1.2	NA	BdiBd21-3.1G0877600.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	64847468	64850473	-	3006

field	value
#pacId	PAC:42959567
locusName	BdiBd21-3.1G0877600
transcriptName	BdiBd21-3.1G0877600.1
peptideName	BdiBd21-3.1G0877600.1.p
Pfam	PF00394 PF07731 PF07732
Panther	PTHR11709:SF287
ec	NA
KOG	EC:1.10.3.2
KO	K05909
GO	GO:0005507 GO:0016491
Best-hit-arabi-name	AT2G40370
Best-hit-arabi-defline	(1 of 1) PTHR11709:SF511 - LACCASE-5
Best-hit-clamy-name	Cre01.g031500
Best-hit-clamy-defline	(1 of 1) 1.10.3.2//1.10.3.3 - laccase. / urishiol oxidase. // L-ascorbate oxidase. / ascorbase.
Best-hit-rice-name	LOC_Os03g18640
Best-hit-rice-defline	(1 of 1) PTHR11709:SF287 - LACCASE
locus_clean	BdiBd21-3.1G0877600
transcript_clean	BdiBd21-3.1G0877600.1

field	value
locusName	BdiBd21-3.1G0877600
transcriptName	BdiBd21-3.1G0877600.1
peptideName	BdiBd21-3.1G0877600.1.p
go_id	GO:0005507; GO:0016491
TERM	copper ion binding; oxidoreductase activity
ONTOLOGY	MF
DEFINITION	Binding to a copper (Cu) ion.; Catalysis of an oxidation-reduction (redox) reaction, a reversible chemical reaction in which the oxidation state of an atom or atoms within a molecule is altered. One substrate acts as a hydrogen or electron donor and becomes oxidized, while the other acts as hydrogen or electron acceptor and becomes reduced.

key	value
gene_id	BdiBd21-3.1G0906700.v1.2
gene_name	NA
seqname	Bd1
strand	+
start	66615690
end	66617565
gene_length_bp	1876
n_transcripts	1
feature_counts	exon: 4; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0906700.v1.2	NA	BdiBd21-3.1G0906700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	66615690	66616167	+	478
BdiBd21-3.1G0906700.v1.2	NA	BdiBd21-3.1G0906700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	66616270	66616554	+	285
BdiBd21-3.1G0906700.v1.2	NA	BdiBd21-3.1G0906700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	66616635	66616802	+	168
BdiBd21-3.1G0906700.v1.2	NA	BdiBd21-3.1G0906700.1.v1.2	exon	phytozomev13	NA	NA	Bd1	66616889	66617565	+	677
BdiBd21-3.1G0906700.v1.2	NA	BdiBd21-3.1G0906700.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	66615690	66617565	+	1876

field	value
#pacId	PAC:42966103
locusName	BdiBd21-3.1G0906700
transcriptName	BdiBd21-3.1G0906700.1
peptideName	BdiBd21-3.1G0906700.1.p
Pfam	PF08450 PF20067
Panther	PTHR10426:SF21
ec	KOG1520
KOG	EC:4.3.3.2
KO	NA
GO	NA
Best-hit-arabi-name	AT3G59530
Best-hit-arabi-defline	(1 of 1) PTHR10426:SF21 - POLLEN DEVELOPMENT PROTEIN LAP3
Best-hit-clamy-name	Cre12.g549050
Best-hit-clamy-defline	(1 of 1) 4.3.3.2 - strictosidine synthase. / strictosidine synthetase.
Best-hit-rice-name	LOC_Os03g15710
Best-hit-rice-defline	(1 of 1) PTHR10426:SF21 - POLLEN DEVELOPMENT PROTEIN LAP3
locus_clean	BdiBd21-3.1G0906700
transcript_clean	BdiBd21-3.1G0906700.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.1G0921900.v1.2
gene_name	NA
seqname	Bd1
strand	-
start	67607418
end	67608630
gene_length_bp	1213
n_transcripts	1
feature_counts	exon: 1; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0921900.v1.2	NA	BdiBd21-3.1G0921900.1.v1.2	exon	phytozomev13	NA	NA	Bd1	67607418	67608630	-	1213
BdiBd21-3.1G0921900.v1.2	NA	BdiBd21-3.1G0921900.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	67607418	67608630	-	1213

field	value
#pacId	PAC:42965383
locusName	BdiBd21-3.1G0921900
transcriptName	BdiBd21-3.1G0921900.1
peptideName	BdiBd21-3.1G0921900.1.p
Pfam	NA
Panther	PTHR36481:SF2
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	NA
Best-hit-arabi-defline	NA
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os03g14150
Best-hit-rice-defline	(1 of 136) IPR036426 - Bulb-type lectin domain superfamily
locus_clean	BdiBd21-3.1G0921900
transcript_clean	BdiBd21-3.1G0921900.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.1G0922000.v1.2
gene_name	NA
seqname	Bd1
strand	-
start	67612962
end	67614218
gene_length_bp	1257
n_transcripts	1
feature_counts	exon: 1; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0922000.v1.2	NA	BdiBd21-3.1G0922000.1.v1.2	exon	phytozomev13	NA	NA	Bd1	67612962	67614218	-	1257
BdiBd21-3.1G0922000.v1.2	NA	BdiBd21-3.1G0922000.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	67612962	67614218	-	1257

field	value
#pacId	PAC:42966816
locusName	BdiBd21-3.1G0922000
transcriptName	BdiBd21-3.1G0922000.1
peptideName	BdiBd21-3.1G0922000.1.p
Pfam	NA
Panther	PTHR36481:SF2
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	NA
Best-hit-arabi-defline	NA
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os03g14150
Best-hit-rice-defline	(1 of 136) IPR036426 - Bulb-type lectin domain superfamily
locus_clean	BdiBd21-3.1G0922000
transcript_clean	BdiBd21-3.1G0922000.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.1G0934100.v1.2
gene_name	NA
seqname	Bd1
strand	-
start	68434113
end	68435446
gene_length_bp	1334
n_transcripts	2
feature_counts	exon: 4; transcript: 2

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0934100.v1.2	NA	BdiBd21-3.1G0934100.1.v1.2	exon	phytozomev13	NA	NA	Bd1	68434115	68435129	-	1015
BdiBd21-3.1G0934100.v1.2	NA	BdiBd21-3.1G0934100.1.v1.2	exon	phytozomev13	NA	NA	Bd1	68435237	68435426	-	190
BdiBd21-3.1G0934100.v1.2	NA	BdiBd21-3.1G0934100.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	68434115	68435426	-	1312
BdiBd21-3.1G0934100.v1.2	NA	BdiBd21-3.1G0934100.2.v1.2	exon	phytozomev13	NA	NA	Bd1	68434113	68435126	-	1014
BdiBd21-3.1G0934100.v1.2	NA	BdiBd21-3.1G0934100.2.v1.2	exon	phytozomev13	NA	NA	Bd1	68435237	68435446	-	210
BdiBd21-3.1G0934100.v1.2	NA	BdiBd21-3.1G0934100.2.v1.2	transcript	phytozomev13	NA	NA	Bd1	68434113	68435446	-	1334

field	value
#pacId	PAC:42966208
locusName	BdiBd21-3.1G0934100
transcriptName	BdiBd21-3.1G0934100.1
peptideName	BdiBd21-3.1G0934100.1.p
Pfam	PF00314
Panther	PTHR31048:SF219
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT1G75050
Best-hit-arabi-defline	(1 of 3) PTHR31048:SF140 - PATHOGENESIS-RELATED PROTEIN 5-RELATED
Best-hit-clamy-name	Cre02.g102300
Best-hit-clamy-defline	(1 of 1) PTHR31013:SF2 - PROTEIN THN-1-RELATED
Best-hit-rice-name	LOC_Os03g13070
Best-hit-rice-defline	(1 of 1) PTHR31048:SF219 - OS03G0233200 PROTEIN
locus_clean	BdiBd21-3.1G0934100
transcript_clean	BdiBd21-3.1G0934100.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.1G0971000.v1.2
gene_name	NA
seqname	Bd1
strand	+
start	70732913
end	70734823
gene_length_bp	1911
n_transcripts	1
feature_counts	exon: 2; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.1G0971000.v1.2	NA	BdiBd21-3.1G0971000.1.v1.2	exon	phytozomev13	NA	NA	Bd1	70732913	70733363	+	451
BdiBd21-3.1G0971000.v1.2	NA	BdiBd21-3.1G0971000.1.v1.2	exon	phytozomev13	NA	NA	Bd1	70733484	70734823	+	1340
BdiBd21-3.1G0971000.v1.2	NA	BdiBd21-3.1G0971000.1.v1.2	transcript	phytozomev13	NA	NA	Bd1	70732913	70734823	+	1911

field	value
#pacId	PAC:42967984
locusName	BdiBd21-3.1G0971000
transcriptName	BdiBd21-3.1G0971000.1
peptideName	BdiBd21-3.1G0971000.1.p
Pfam	PF02458
Panther	PTHR31642:SF351
ec	NA
KOG	EC:2.3.1.138
KO	NA
GO	NA
Best-hit-arabi-name	AT5G48930
Best-hit-arabi-defline	(1 of 1) K13065 - shikimate O-hydroxycinnamoyltransferase (E2.3.1.133, HCT)
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os03g08720
Best-hit-rice-defline	(1 of 3) PTHR31642:SF351 - TRYPTAMINE BENZOYLTRANSFERASE 2
locus_clean	BdiBd21-3.1G0971000
transcript_clean	BdiBd21-3.1G0971000.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.2G0107700.v1.2
gene_name	NA
seqname	Bd2
strand	+
start	6563298
end	6564467
gene_length_bp	1170
n_transcripts	1
feature_counts	exon: 3; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0107700.v1.2	NA	BdiBd21-3.2G0107700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	6563298	6563614	+	317
BdiBd21-3.2G0107700.v1.2	NA	BdiBd21-3.2G0107700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	6563699	6563804	+	106
BdiBd21-3.2G0107700.v1.2	NA	BdiBd21-3.2G0107700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	6563914	6564467	+	554
BdiBd21-3.2G0107700.v1.2	NA	BdiBd21-3.2G0107700.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	6563298	6564467	+	1170

field	value
#pacId	PAC:42978229
locusName	BdiBd21-3.2G0107700
transcriptName	BdiBd21-3.2G0107700.1
peptideName	BdiBd21-3.2G0107700.1.p
Pfam	PF04535
Panther	PTHR36488:SF8
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT4G03540
Best-hit-arabi-defline	(1 of 13) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os01g13560
Best-hit-rice-defline	(1 of 11) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
locus_clean	BdiBd21-3.2G0107700
transcript_clean	BdiBd21-3.2G0107700.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.2G0127300.v1.2
gene_name	NA
seqname	Bd2
strand	-
start	7793597
end	7795741
gene_length_bp	2145
n_transcripts	1
feature_counts	exon: 4; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0127300.v1.2	NA	BdiBd21-3.2G0127300.1.v1.2	exon	phytozomev13	NA	NA	Bd2	7793597	7794220	-	624
BdiBd21-3.2G0127300.v1.2	NA	BdiBd21-3.2G0127300.1.v1.2	exon	phytozomev13	NA	NA	Bd2	7794607	7794772	-	166
BdiBd21-3.2G0127300.v1.2	NA	BdiBd21-3.2G0127300.1.v1.2	exon	phytozomev13	NA	NA	Bd2	7794950	7795141	-	192
BdiBd21-3.2G0127300.v1.2	NA	BdiBd21-3.2G0127300.1.v1.2	exon	phytozomev13	NA	NA	Bd2	7795334	7795741	-	408
BdiBd21-3.2G0127300.v1.2	NA	BdiBd21-3.2G0127300.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	7793597	7795741	-	2145

field	value
#pacId	PAC:42970124
locusName	BdiBd21-3.2G0127300
transcriptName	BdiBd21-3.2G0127300.1
peptideName	BdiBd21-3.2G0127300.1.p
Pfam	PF00141
Panther	PTHR31388:SF164
ec	NA
KOG	EC:1.11.1.7
KO	K00430
GO	GO:0004601 GO:0006979 GO:0020037
Best-hit-arabi-name	AT1G44970
Best-hit-arabi-defline	(1 of 1) PTHR31388:SF164 - PEROXIDASE 9
Best-hit-clamy-name	Cre06.g285150
Best-hit-clamy-defline	(1 of 3) 1.11.1.11 - L-ascorbate peroxidase. / ascorbic acid peroxidase.
Best-hit-rice-name	LOC_Os01g15810
Best-hit-rice-defline	(1 of 1) PTHR31388:SF164 - PEROXIDASE 9
locus_clean	BdiBd21-3.2G0127300
transcript_clean	BdiBd21-3.2G0127300.1

field	value
locusName	BdiBd21-3.2G0127300
transcriptName	BdiBd21-3.2G0127300.1
peptideName	BdiBd21-3.2G0127300.1.p
go_id	GO:0004601; GO:0006979; GO:0020037
TERM	peroxidase activity; response to oxidative stress; heme binding
ONTOLOGY	MF; BP
DEFINITION	Catalysis of the reaction: a donor + a peroxide = an oxidized donor + 2 H2O.; Any process that results in a change in state or activity of a cell or an organism (in terms of movement, secretion, enzyme production, gene expression, etc.) as a result of oxidative stress, a state often resulting from exposure to high levels of reactive oxygen species, e.g. superoxide anions, hydrogen peroxide (H2O2), and hydroxyl radicals.; Binding to a heme, a compound composed of iron complexed in a porphyrin (tetrapyrrole) ring.

key	value
gene_id	BdiBd21-3.2G0228600.v1.2
gene_name	NA
seqname	Bd2
strand	-
start	15325424
end	15328045
gene_length_bp	2622
n_transcripts	1
feature_counts	exon: 7; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	exon	phytozomev13	NA	NA	Bd2	15325424	15326051	-	628
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	exon	phytozomev13	NA	NA	Bd2	15326132	15326224	-	93
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	exon	phytozomev13	NA	NA	Bd2	15326324	15326404	-	81
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	exon	phytozomev13	NA	NA	Bd2	15326499	15326604	-	106
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	exon	phytozomev13	NA	NA	Bd2	15326711	15326778	-	68
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	exon	phytozomev13	NA	NA	Bd2	15326884	15326955	-	72
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	exon	phytozomev13	NA	NA	Bd2	15327064	15328045	-	982
BdiBd21-3.2G0228600.v1.2	NA	BdiBd21-3.2G0228600.2.v1.2	transcript	phytozomev13	NA	NA	Bd2	15325424	15328045	-	2622

field	value
#pacId	PAC:42975108
locusName	BdiBd21-3.2G0228600
transcriptName	BdiBd21-3.2G0228600.2
peptideName	BdiBd21-3.2G0228600.2.p
Pfam	PF12428 PF12906
Panther	PTHR23012:SF164
ec	NA
KOG	EC:2.3.2.27
KO	NA
GO	GO:0008270
Best-hit-arabi-name	AT2G01275
Best-hit-arabi-defline	(1 of 1) PTHR23012:SF93 - RING/FYVE/PHD ZINC FINGER-CONTAINING PROTEIN
Best-hit-clamy-name	Cre09.g400738
Best-hit-clamy-defline	(1 of 1) PTHR23012:SF217 - RING_FYVE_PHD ZINC FINGER SUPERFAMILY PROTEIN
Best-hit-rice-name	LOC_Os05g47900
Best-hit-rice-defline	(1 of 1) PTHR23012:SF164 - OS05G0552400 PROTEIN
locus_clean	BdiBd21-3.2G0228600
transcript_clean	BdiBd21-3.2G0228600.2

field	value
locusName	BdiBd21-3.2G0228600
transcriptName	BdiBd21-3.2G0228600.2
peptideName	BdiBd21-3.2G0228600.2.p
go_id	GO:0008270
TERM	zinc ion binding
ONTOLOGY	MF
DEFINITION	Binding to a zinc ion (Zn).

key	value
gene_id	BdiBd21-3.2G0308600.v1.2
gene_name	NA
seqname	Bd2
strand	-
start	20879287
end	20881655
gene_length_bp	2369
n_transcripts	1
feature_counts	exon: 4; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0308600.v1.2	NA	BdiBd21-3.2G0308600.1.v1.2	exon	phytozomev13	NA	NA	Bd2	20879287	20879432	-	146
BdiBd21-3.2G0308600.v1.2	NA	BdiBd21-3.2G0308600.1.v1.2	exon	phytozomev13	NA	NA	Bd2	20879473	20879746	-	274
BdiBd21-3.2G0308600.v1.2	NA	BdiBd21-3.2G0308600.1.v1.2	exon	phytozomev13	NA	NA	Bd2	20880560	20880699	-	140
BdiBd21-3.2G0308600.v1.2	NA	BdiBd21-3.2G0308600.1.v1.2	exon	phytozomev13	NA	NA	Bd2	20881142	20881655	-	514
BdiBd21-3.2G0308600.v1.2	NA	BdiBd21-3.2G0308600.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	20879287	20881655	-	2369

field	value
#pacId	PAC:42978838
locusName	BdiBd21-3.2G0308600
transcriptName	BdiBd21-3.2G0308600.1
peptideName	BdiBd21-3.2G0308600.1.p
Pfam	PF04434
Panther	PTHR31669:SF296
ec	NA
KOG	NA
KO	NA
GO	GO:0008270
Best-hit-arabi-name	AT4G15090
Best-hit-arabi-defline	(1 of 1) PTHR31669:SF21 - PROTEIN FAR-RED IMPAIRED RESPONSE 1
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os09g01780
Best-hit-rice-defline	(1 of 4) PTHR31669:SF296 - PROTEIN FAR1-RELATED SEQUENCE
locus_clean	BdiBd21-3.2G0308600
transcript_clean	BdiBd21-3.2G0308600.1

field	value
locusName	BdiBd21-3.2G0308600
transcriptName	BdiBd21-3.2G0308600.1
peptideName	BdiBd21-3.2G0308600.1.p
go_id	GO:0008270
TERM	zinc ion binding
ONTOLOGY	MF
DEFINITION	Binding to a zinc ion (Zn).

key	value
gene_id	BdiBd21-3.2G0593700.v1.2
gene_name	NA
seqname	Bd2
strand	+
start	46405432
end	46408110
gene_length_bp	2679
n_transcripts	2
feature_counts	exon: 18; transcript: 2

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46405520	46405774	+	255
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46405958	46406034	+	77
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46406274	46406502	+	229
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46406701	46406855	+	155
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46406951	46406996	+	46
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46407098	46407189	+	92
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46407281	46407377	+	97
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46407487	46407543	+	57
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	exon	phytozomev13	NA	NA	Bd2	46407628	46408110	+	483
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	46405520	46408110	+	2591
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46405432	46405774	+	343
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46405958	46406034	+	77
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46406274	46406502	+	229
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46406701	46406855	+	155
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46406951	46406996	+	46
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46407098	46407189	+	92
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46407281	46407377	+	97
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46407487	46407543	+	57
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	exon	phytozomev13	NA	NA	Bd2	46407643	46408110	+	468
BdiBd21-3.2G0593700.v1.2	NA	BdiBd21-3.2G0593700.2.v1.2	transcript	phytozomev13	NA	NA	Bd2	46405432	46408110	+	2679

field	value
#pacId	PAC:42973964
locusName	BdiBd21-3.2G0593700
transcriptName	BdiBd21-3.2G0593700.1
peptideName	BdiBd21-3.2G0593700.1.p
Pfam	NA
Panther	PTHR36329:SF1
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT1G52155
Best-hit-arabi-defline	NA
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os01g48570
Best-hit-rice-defline	(1 of 1644) 2.7.11.1 - non-specific serine/threonine protein kinase. / threonine-specific protein kinase.
locus_clean	BdiBd21-3.2G0593700
transcript_clean	BdiBd21-3.2G0593700.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.2G0608366.v1.2
gene_name	NA
seqname	Bd2
strand	+
start	47433862
end	47439571
gene_length_bp	5710
n_transcripts	1
feature_counts	exon: 9; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47433862	47434699	+	838
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47434778	47434837	+	60
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47435180	47435262	+	83
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47435478	47435640	+	163
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47435735	47435864	+	130
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47437612	47437770	+	159
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47437852	47438024	+	173
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47438124	47438204	+	81
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	exon	phytozomev13	NA	NA	Bd2	47439216	47439571	+	356
BdiBd21-3.2G0608366.v1.2	NA	BdiBd21-3.2G0608366.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	47433862	47439571	+	5710

field	value
#pacId	PAC:42969143
locusName	BdiBd21-3.2G0608366
transcriptName	BdiBd21-3.2G0608366.1
peptideName	BdiBd21-3.2G0608366.1.p
Pfam	PF00226 PF14308
Panther	PTHR44094:SF6
ec	KOG0691
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT4G39150
Best-hit-arabi-defline	(1 of 1) PTHR44094:SF23 - J DOMAIN-CONTAINING PROTEIN
Best-hit-clamy-name	Cre06.g260350
Best-hit-clamy-defline	(1 of 1) PTHR44094:SF8 - J DOMAIN-CONTAINING PROTEIN
Best-hit-rice-name	LOC_Os01g50700
Best-hit-rice-defline	(1 of 1) PTHR44094:SF6 - OS01G0702450 PROTEIN
locus_clean	BdiBd21-3.2G0608366
transcript_clean	BdiBd21-3.2G0608366.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.2G0651101.v1.2
gene_name	NA
seqname	Bd2
strand	-
start	50109320
end	50110653
gene_length_bp	1334
n_transcripts	1
feature_counts	exon: 1; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0651101.v1.2	NA	BdiBd21-3.2G0651101.1.v1.2	exon	phytozomev13	NA	NA	Bd2	50109320	50110653	-	1334
BdiBd21-3.2G0651101.v1.2	NA	BdiBd21-3.2G0651101.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	50109320	50110653	-	1334

field	value
#pacId	PAC:42972491
locusName	BdiBd21-3.2G0651101
transcriptName	BdiBd21-3.2G0651101.1
peptideName	BdiBd21-3.2G0651101.1.p
Pfam	PF00036 PF13833
Panther	PTHR10891:SF1008
ec	KOG0027
KOG	NA
KO	K13448
GO	GO:0005509
Best-hit-arabi-name	AT3G50770
Best-hit-arabi-defline	(1 of 1) PTHR23050:SF390 - CALCIUM-BINDING PROTEIN CML41-RELATED
Best-hit-clamy-name	Cre03.g178350
Best-hit-clamy-defline	(1 of 3) PTHR23050:SF523 - AT16150P-RELATED
Best-hit-rice-name	LOC_Os01g56030
Best-hit-rice-defline	(1 of 1) PF13405//PF13833 - EF-hand domain (EF-hand_6) // EF-hand domain pair (EF-hand_8)
locus_clean	BdiBd21-3.2G0651101
transcript_clean	BdiBd21-3.2G0651101.1

field	value
locusName	BdiBd21-3.2G0651101
transcriptName	BdiBd21-3.2G0651101.1
peptideName	BdiBd21-3.2G0651101.1.p
go_id	GO:0005509
TERM	calcium ion binding
ONTOLOGY	MF
DEFINITION	Binding to a calcium ion (Ca2+).

key	value
gene_id	BdiBd21-3.2G0681800.v1.2
gene_name	NA
seqname	Bd2
strand	+
start	51927156
end	51933373
gene_length_bp	6218
n_transcripts	2
feature_counts	exon: 39; transcript: 2

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51927156	51927312	+	157
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51927426	51927656	+	231
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51928192	51928312	+	121
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51928391	51928462	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51928629	51928703	+	75
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51928801	51928872	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51928967	51929128	+	162
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51929238	51929309	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51929390	51929461	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51929553	51929624	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51929710	51929778	+	69
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51929857	51929931	+	75
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51930397	51930468	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51930706	51930840	+	135
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51930920	51931389	+	470
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51931461	51931619	+	159
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51931821	51931960	+	140
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51932042	51932261	+	220
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51932355	51932590	+	236
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51932678	51933373	+	696
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	51927156	51933373	+	6218
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51927381	51927656	+	276
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51928192	51928312	+	121
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51928391	51928462	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51928629	51928703	+	75
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51928801	51928872	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51928967	51929128	+	162
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51929238	51929309	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51929390	51929461	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51929553	51929624	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51929710	51929778	+	69
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51929857	51929931	+	75
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51930397	51930468	+	72
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51930706	51930840	+	135
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51930920	51931389	+	470
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51931461	51931619	+	159
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51931821	51931960	+	140
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51932042	51932261	+	220
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51932355	51932590	+	236
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51932678	51933373	+	696
BdiBd21-3.2G0681800.v1.2	NA	BdiBd21-3.2G0681800.2.v1.2	transcript	phytozomev13	NA	NA	Bd2	51927381	51933373	+	5993

field	value
#pacId	PAC:42974660
locusName	BdiBd21-3.2G0681800
transcriptName	BdiBd21-3.2G0681800.1
peptideName	BdiBd21-3.2G0681800.1.p
Pfam	PF00560 PF07714 PF08263
Panther	PTHR48056:SF81
ec	KOG1187
KOG	EC:2.7.11.1
KO	NA
GO	GO:0004672 GO:0004713 GO:0005515 GO:0005524 GO:0006468
Best-hit-arabi-name	AT1G79620
Best-hit-arabi-defline	(1 of 1) PTHR45974:SF242 - LEUCINE-RICH REPEAT PROTEIN KINASE FAMILY PROTEIN
Best-hit-clamy-name	Cre12.g532050
Best-hit-clamy-defline	(1 of 3) 2.3.2.27//2.7.11.1 - RING-type E3 ubiquitin transferase. / ubiquitin transferase RING E3. // non-specific serine/threonine protein kinase. / threonine-specific protein kinase.
Best-hit-rice-name	LOC_Os01g60060
Best-hit-rice-defline	(1 of 1) PTHR45974:SF207 - LEUCINE-RICH REPEAT PROTEIN KINASE FAMILY PROTEIN
locus_clean	BdiBd21-3.2G0681800
transcript_clean	BdiBd21-3.2G0681800.1

field	value
locusName	BdiBd21-3.2G0681800
transcriptName	BdiBd21-3.2G0681800.1; BdiBd21-3.2G0681800.2
peptideName	BdiBd21-3.2G0681800.1.p; BdiBd21-3.2G0681800.2.p
go_id	GO:0004672; GO:0004713; GO:0005515; GO:0005524; GO:0006468
TERM	protein kinase activity; protein tyrosine kinase activity; protein binding; ATP binding; protein phosphorylation
ONTOLOGY	MF; BP
DEFINITION	Catalysis of the phosphorylation of an amino acid residue in a protein, usually according to the reaction: a protein + ATP = a phosphoprotein + ADP.; Catalysis of the reaction: ATP + a protein tyrosine = ADP + protein tyrosine phosphate.; Binding to a protein.; Binding to ATP, adenosine 5’-triphosphate, a universally important coenzyme and enzyme regulator.; The process of introducing a phosphate group on to a protein.

key	value
gene_id	BdiBd21-3.2G0681900.v1.2
gene_name	NA
seqname	Bd2
strand	+
start	51934460
end	51940387
gene_length_bp	5928
n_transcripts	2
feature_counts	exon: 34; transcript: 2

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51934541	51934625	+	85
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51935048	51935177	+	130
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51935247	51935318	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51935632	51935706	+	75
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51935796	51935864	+	69
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51935980	51936141	+	162
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51936260	51936331	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51936362	51936475	+	114
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51936551	51936622	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51936701	51936769	+	69
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51936844	51936918	+	75
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51937042	51937113	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51937201	51937335	+	135
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51937427	51937908	+	482
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51937980	51938138	+	159
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51938968	51939107	+	140
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51939187	51939406	+	220
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51939492	51939724	+	233
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	exon	phytozomev13	NA	NA	Bd2	51939815	51940387	+	573
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	51934541	51940387	+	5847
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51934460	51934625	+	166
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51935048	51935177	+	130
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51935247	51935318	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51935632	51935706	+	75
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51935796	51935864	+	69
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51935980	51936141	+	162
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51936260	51936331	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51936404	51936475	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51936551	51936622	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51936701	51936769	+	69
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51936844	51936918	+	75
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51937042	51937113	+	72
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51937197	51937335	+	139
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51937427	51937908	+	482
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	exon	phytozomev13	NA	NA	Bd2	51937980	51938137	+	158
BdiBd21-3.2G0681900.v1.2	NA	BdiBd21-3.2G0681900.2.v1.2	transcript	phytozomev13	NA	NA	Bd2	51934460	51938137	+	3678

field	value
#pacId	PAC:42968805
locusName	BdiBd21-3.2G0681900
transcriptName	BdiBd21-3.2G0681900.1
peptideName	BdiBd21-3.2G0681900.1.p
Pfam	PF00560 PF07714 PF08263
Panther	PTHR45974:SF295
ec	KOG1187
KOG	EC:2.7.11.1
KO	NA
GO	GO:0004672 GO:0004713 GO:0005515 GO:0005524 GO:0006468
Best-hit-arabi-name	AT1G79620
Best-hit-arabi-defline	(1 of 1) PTHR45974:SF242 - LEUCINE-RICH REPEAT PROTEIN KINASE FAMILY PROTEIN
Best-hit-clamy-name	Cre12.g532050
Best-hit-clamy-defline	(1 of 3) 2.3.2.27//2.7.11.1 - RING-type E3 ubiquitin transferase. / ubiquitin transferase RING E3. // non-specific serine/threonine protein kinase. / threonine-specific protein kinase.
Best-hit-rice-name	LOC_Os05g40770
Best-hit-rice-defline	(1 of 1) PTHR45974:SF229 - OS05G0486100 PROTEIN
locus_clean	BdiBd21-3.2G0681900
transcript_clean	BdiBd21-3.2G0681900.1

field	value
locusName	BdiBd21-3.2G0681900
transcriptName	BdiBd21-3.2G0681900.1; BdiBd21-3.2G0681900.2
peptideName	BdiBd21-3.2G0681900.1.p; BdiBd21-3.2G0681900.2.p
go_id	GO:0004672; GO:0004713; GO:0005515; GO:0005524; GO:0006468
TERM	protein kinase activity; protein tyrosine kinase activity; protein binding; ATP binding; protein phosphorylation
ONTOLOGY	MF; BP
DEFINITION	Catalysis of the phosphorylation of an amino acid residue in a protein, usually according to the reaction: a protein + ATP = a phosphoprotein + ADP.; Catalysis of the reaction: ATP + a protein tyrosine = ADP + protein tyrosine phosphate.; Binding to a protein.; Binding to ATP, adenosine 5’-triphosphate, a universally important coenzyme and enzyme regulator.; The process of introducing a phosphate group on to a protein.

key	value
gene_id	BdiBd21-3.2G0698500.v1.2
gene_name	NA
seqname	Bd2
strand	+
start	52963651
end	52966243
gene_length_bp	2593
n_transcripts	1
feature_counts	exon: 4; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0698500.v1.2	NA	BdiBd21-3.2G0698500.1.v1.2	exon	phytozomev13	NA	NA	Bd2	52963651	52964405	+	755
BdiBd21-3.2G0698500.v1.2	NA	BdiBd21-3.2G0698500.1.v1.2	exon	phytozomev13	NA	NA	Bd2	52964553	52964675	+	123
BdiBd21-3.2G0698500.v1.2	NA	BdiBd21-3.2G0698500.1.v1.2	exon	phytozomev13	NA	NA	Bd2	52964808	52964969	+	162
BdiBd21-3.2G0698500.v1.2	NA	BdiBd21-3.2G0698500.1.v1.2	exon	phytozomev13	NA	NA	Bd2	52965064	52966243	+	1180
BdiBd21-3.2G0698500.v1.2	NA	BdiBd21-3.2G0698500.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	52963651	52966243	+	2593

field	value
#pacId	PAC:42974040
locusName	BdiBd21-3.2G0698500
transcriptName	BdiBd21-3.2G0698500.1
peptideName	BdiBd21-3.2G0698500.1.p
Pfam	PF01417
Panther	PTHR12276:SF116
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT3G46540
Best-hit-arabi-defline	(1 of 1) PTHR12276:SF116 - ENTH_VHS FAMILY PROTEIN
Best-hit-clamy-name	Cre16.g664450
Best-hit-clamy-defline	(1 of 1) PTHR12276:SF45 - CLATHRIN INTERACTOR 1
Best-hit-rice-name	LOC_Os01g62370
Best-hit-rice-defline	(1 of 1) PTHR12276:SF116 - ENTH_VHS FAMILY PROTEIN
locus_clean	BdiBd21-3.2G0698500
transcript_clean	BdiBd21-3.2G0698500.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.2G0739000.v1.2
gene_name	NA
seqname	Bd2
strand	-
start	55329136
end	55331303
gene_length_bp	2168
n_transcripts	1
feature_counts	exon: 3; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0739000.v1.2	NA	BdiBd21-3.2G0739000.2.v1.2	exon	phytozomev13	NA	NA	Bd2	55329136	55329540	-	405
BdiBd21-3.2G0739000.v1.2	NA	BdiBd21-3.2G0739000.2.v1.2	exon	phytozomev13	NA	NA	Bd2	55329640	55330596	-	957
BdiBd21-3.2G0739000.v1.2	NA	BdiBd21-3.2G0739000.2.v1.2	exon	phytozomev13	NA	NA	Bd2	55331043	55331303	-	261
BdiBd21-3.2G0739000.v1.2	NA	BdiBd21-3.2G0739000.2.v1.2	transcript	phytozomev13	NA	NA	Bd2	55329136	55331303	-	2168

field	value
#pacId	PAC:42975530
locusName	BdiBd21-3.2G0739000
transcriptName	BdiBd21-3.2G0739000.2
peptideName	BdiBd21-3.2G0739000.2.p
Pfam	PF01190
Panther	PTHR33470:SF27
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	NA
Best-hit-arabi-defline	NA
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os01g67390
Best-hit-rice-defline	(1 of 1) PTHR33470:SF27 - OS01G0899700 PROTEIN
locus_clean	BdiBd21-3.2G0739000
transcript_clean	BdiBd21-3.2G0739000.2

table vide/incorrecte

key	value
gene_id	BdiBd21-3.2G0799100.v1.2
gene_name	NA
seqname	Bd2
strand	+
start	58464986
end	58467953
gene_length_bp	2968
n_transcripts	2
feature_counts	exon: 7; transcript: 2

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.1.v1.2	exon	phytozomev13	NA	NA	Bd2	58464986	58465681	+	696
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.1.v1.2	exon	phytozomev13	NA	NA	Bd2	58465825	58465968	+	144
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.1.v1.2	exon	phytozomev13	NA	NA	Bd2	58466829	58467953	+	1125
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.1.v1.2	transcript	phytozomev13	NA	NA	Bd2	58464986	58467953	+	2968
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.2.v1.2	exon	phytozomev13	NA	NA	Bd2	58465149	58465254	+	106
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.2.v1.2	exon	phytozomev13	NA	NA	Bd2	58465362	58465681	+	320
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.2.v1.2	exon	phytozomev13	NA	NA	Bd2	58465825	58465968	+	144
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.2.v1.2	exon	phytozomev13	NA	NA	Bd2	58466829	58467939	+	1111
BdiBd21-3.2G0799100.v1.2	NA	BdiBd21-3.2G0799100.2.v1.2	transcript	phytozomev13	NA	NA	Bd2	58465149	58467939	+	2791

field	value
#pacId	PAC:42973558
locusName	BdiBd21-3.2G0799100
transcriptName	BdiBd21-3.2G0799100.1
peptideName	BdiBd21-3.2G0799100.1.p
Pfam	PF03106
Panther	PTHR31221:SF42
ec	NA
KOG	NA
KO	NA
GO	GO:0003700 GO:0006355 GO:0043565
Best-hit-arabi-name	AT5G43290
Best-hit-arabi-defline	(1 of 3) PTHR32096:SF18 - DISEASE RESISTANCE PROTEIN-LIKE-RELATED
Best-hit-clamy-name	Cre04.g228400
Best-hit-clamy-defline	(1 of 1) PTHR32096:SF137 - WRKY DOMAIN-CONTAINING PROTEIN
Best-hit-rice-name	LOC_Os01g74140
Best-hit-rice-defline	(1 of 1) PTHR31221:SF42 - WRKY TRANSCRIPTION FACTOR 49-RELATED
locus_clean	BdiBd21-3.2G0799100
transcript_clean	BdiBd21-3.2G0799100.1

field	value
locusName	BdiBd21-3.2G0799100
transcriptName	BdiBd21-3.2G0799100.1; BdiBd21-3.2G0799100.2
peptideName	BdiBd21-3.2G0799100.1.p; BdiBd21-3.2G0799100.2.p
go_id	GO:0003700; GO:0006355; GO:0043565
TERM	DNA-binding transcription factor activity; regulation of DNA-templated transcription; sequence-specific DNA binding
ONTOLOGY	MF; BP
DEFINITION	A transcription regulator activity that modulates transcription of gene sets via selective and non-covalent binding to a specific double-stranded genomic DNA sequence (sometimes referred to as a motif) within a cis-regulatory region. Regulatory regions include promoters (proximal and distal) and enhancers. Genes are transcriptional units, and include bacterial operons.; Any process that modulates the frequency, rate or extent of cellular DNA-templated transcription.; Binding to DNA of a specific nucleotide composition, e.g. GC-rich DNA binding, or with a specific sequence motif or type of DNA e.g. promotor binding or rDNA binding.

key	value
gene_id	BdiBd21-3.3G0107501.v1.2
gene_name	NA
seqname	Bd3
strand	+
start	6368068
end	6369288
gene_length_bp	1221
n_transcripts	1
feature_counts	exon: 1; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0107501.v1.2	NA	BdiBd21-3.3G0107501.1.v1.2	exon	phytozomev13	NA	NA	Bd3	6368068	6369288	+	1221
BdiBd21-3.3G0107501.v1.2	NA	BdiBd21-3.3G0107501.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	6368068	6369288	+	1221

field	value
#pacId	PAC:42981600
locusName	BdiBd21-3.3G0107501
transcriptName	BdiBd21-3.3G0107501.1
peptideName	BdiBd21-3.3G0107501.1.p
Pfam	NA
Panther	PTHR33237:SF4
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT1G71740
Best-hit-arabi-defline	(1 of 1) PTHR33237:SF4 - F14O23.12
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os02g11950
Best-hit-rice-defline	(1 of 1) PTHR33237:SF4 - F14O23.12
locus_clean	BdiBd21-3.3G0107501
transcript_clean	BdiBd21-3.3G0107501.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.3G0171800.v1.2
gene_name	NA
seqname	Bd3
strand	+
start	11805987
end	11807919
gene_length_bp	1933
n_transcripts	1
feature_counts	exon: 2; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0171800.v1.2	NA	BdiBd21-3.3G0171800.1.v1.2	exon	phytozomev13	NA	NA	Bd3	11805987	11806982	+	996
BdiBd21-3.3G0171800.v1.2	NA	BdiBd21-3.3G0171800.1.v1.2	exon	phytozomev13	NA	NA	Bd3	11807084	11807919	+	836
BdiBd21-3.3G0171800.v1.2	NA	BdiBd21-3.3G0171800.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	11805987	11807919	+	1933

field	value
#pacId	PAC:42990632
locusName	BdiBd21-3.3G0171800
transcriptName	BdiBd21-3.3G0171800.1
peptideName	BdiBd21-3.3G0171800.1.p
Pfam	PF04535
Panther	PTHR36488:SF8
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT5G06200
Best-hit-arabi-defline	(1 of 13) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os08g01160
Best-hit-rice-defline	(1 of 11) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
locus_clean	BdiBd21-3.3G0171800
transcript_clean	BdiBd21-3.3G0171800.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.3G0291100.v1.2
gene_name	NA
seqname	Bd3
strand	+
start	20237951
end	20239249
gene_length_bp	1299
n_transcripts	1
feature_counts	exon: 1; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0291100.v1.2	NA	BdiBd21-3.3G0291100.1.v1.2	exon	phytozomev13	NA	NA	Bd3	20237951	20239249	+	1299
BdiBd21-3.3G0291100.v1.2	NA	BdiBd21-3.3G0291100.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	20237951	20239249	+	1299

field	value
#pacId	PAC:42983070
locusName	BdiBd21-3.3G0291100
transcriptName	BdiBd21-3.3G0291100.1
peptideName	BdiBd21-3.3G0291100.1.p
Pfam	NA
Panther	PTHR36481:SF3
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	NA
Best-hit-arabi-defline	NA
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os10g06680
Best-hit-rice-defline	(1 of 136) IPR036426 - Bulb-type lectin domain superfamily
locus_clean	BdiBd21-3.3G0291100
transcript_clean	BdiBd21-3.3G0291100.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.3G0383000.v1.2
gene_name	NA
seqname	Bd3
strand	-
start	31363408
end	31367085
gene_length_bp	3678
n_transcripts	1
feature_counts	exon: 2; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0383000.v1.2	NA	BdiBd21-3.3G0383000.1.v1.2	exon	phytozomev13	NA	NA	Bd3	31363408	31364640	-	1233
BdiBd21-3.3G0383000.v1.2	NA	BdiBd21-3.3G0383000.1.v1.2	exon	phytozomev13	NA	NA	Bd3	31365522	31367085	-	1564
BdiBd21-3.3G0383000.v1.2	NA	BdiBd21-3.3G0383000.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	31363408	31367085	-	3678

field	value
#pacId	PAC:42990880
locusName	BdiBd21-3.3G0383000
transcriptName	BdiBd21-3.3G0383000.1
peptideName	BdiBd21-3.3G0383000.1.p
Pfam	PF00067
Panther	PTHR24296:SF3
ec	KOG0157
KOG	EC:1.14.15.3
KO	K15402
GO	GO:0004497 GO:0005506 GO:0016705 GO:0020037
Best-hit-arabi-name	AT5G23190
Best-hit-arabi-defline	(1 of 2) PTHR24296:SF3 - CYTOCHROME P450 86B1-RELATED
Best-hit-clamy-name	Cre01.g003850
Best-hit-clamy-defline	(1 of 2) PTHR24291:SF189 - CYTOCHROME P450 4V2
Best-hit-rice-name	LOC_Os10g34480
Best-hit-rice-defline	(1 of 1) PTHR24296:SF3 - CYTOCHROME P450 86B1-RELATED
locus_clean	BdiBd21-3.3G0383000
transcript_clean	BdiBd21-3.3G0383000.1

field	value
locusName	BdiBd21-3.3G0383000
transcriptName	BdiBd21-3.3G0383000.1
peptideName	BdiBd21-3.3G0383000.1.p
go_id	GO:0004497; GO:0005506; GO:0016705; GO:0020037
TERM	monooxygenase activity; iron ion binding; oxidoreductase activity, acting on paired donors, with incorporation or reduction of molecular oxygen; heme binding
ONTOLOGY	MF
DEFINITION	Catalysis of the incorporation of one atom of molecular oxygen (O2) into the substrate and the reduction of the other atom of O2 to water.; Binding to an iron (Fe) ion.; Catalysis of an oxidation-reduction (redox) reaction in which hydrogen or electrons are transferred from each of two donors, and molecular oxygen is reduced or incorporated into a donor.; Binding to a heme, a compound composed of iron complexed in a porphyrin (tetrapyrrole) ring.

key	value
gene_id	BdiBd21-3.3G0499200.v1.2
gene_name	NA
seqname	Bd3
strand	-
start	40325708
end	40328336
gene_length_bp	2629
n_transcripts	1
feature_counts	exon: 5; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0499200.v1.2	NA	BdiBd21-3.3G0499200.1.v1.2	exon	phytozomev13	NA	NA	Bd3	40325708	40326782	-	1075
BdiBd21-3.3G0499200.v1.2	NA	BdiBd21-3.3G0499200.1.v1.2	exon	phytozomev13	NA	NA	Bd3	40326868	40327068	-	201
BdiBd21-3.3G0499200.v1.2	NA	BdiBd21-3.3G0499200.1.v1.2	exon	phytozomev13	NA	NA	Bd3	40327545	40327635	-	91
BdiBd21-3.3G0499200.v1.2	NA	BdiBd21-3.3G0499200.1.v1.2	exon	phytozomev13	NA	NA	Bd3	40327718	40327800	-	83
BdiBd21-3.3G0499200.v1.2	NA	BdiBd21-3.3G0499200.1.v1.2	exon	phytozomev13	NA	NA	Bd3	40327895	40328336	-	442
BdiBd21-3.3G0499200.v1.2	NA	BdiBd21-3.3G0499200.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	40325708	40328336	-	2629

field	value
#pacId	PAC:42981882
locusName	BdiBd21-3.3G0499200
transcriptName	BdiBd21-3.3G0499200.1
peptideName	BdiBd21-3.3G0499200.1.p
Pfam	NA
Panther	PTHR33385:SF17
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT1G14630
Best-hit-arabi-defline	(1 of 2) PTHR33385:SF18 - XRI1-LIKE PROTEIN
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os08g36380
Best-hit-rice-defline	(1 of 1) PTHR33385:SF17 - OS08G0466800 PROTEIN
locus_clean	BdiBd21-3.3G0499200
transcript_clean	BdiBd21-3.3G0499200.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.3G0639132.v1.2
gene_name	NA
seqname	Bd3
strand	+
start	49561897
end	49563872
gene_length_bp	1976
n_transcripts	1
feature_counts	exon: 5; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0639132.v1.2	NA	BdiBd21-3.3G0639132.1.v1.2	exon	phytozomev13	NA	NA	Bd3	49561897	49562188	+	292
BdiBd21-3.3G0639132.v1.2	NA	BdiBd21-3.3G0639132.1.v1.2	exon	phytozomev13	NA	NA	Bd3	49562320	49562523	+	204
BdiBd21-3.3G0639132.v1.2	NA	BdiBd21-3.3G0639132.1.v1.2	exon	phytozomev13	NA	NA	Bd3	49562686	49562858	+	173
BdiBd21-3.3G0639132.v1.2	NA	BdiBd21-3.3G0639132.1.v1.2	exon	phytozomev13	NA	NA	Bd3	49562969	49563051	+	83
BdiBd21-3.3G0639132.v1.2	NA	BdiBd21-3.3G0639132.1.v1.2	exon	phytozomev13	NA	NA	Bd3	49563200	49563872	+	673
BdiBd21-3.3G0639132.v1.2	NA	BdiBd21-3.3G0639132.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	49561897	49563872	+	1976

field	value
#pacId	PAC:42983505
locusName	BdiBd21-3.3G0639132
transcriptName	BdiBd21-3.3G0639132.1
peptideName	BdiBd21-3.3G0639132.1.p
Pfam	PF00248
Panther	PTHR43625:SF29
ec	NA
KOG	EC:1.1.1.317
KO	NA
GO	NA
Best-hit-arabi-name	AT1G60710
Best-hit-arabi-defline	(1 of 6) 1.1.1.317 - perakine reductase. / perakine reductase.
Best-hit-clamy-name	Cre11.g467622
Best-hit-clamy-defline	(1 of 1) 1.1.1.317 - perakine reductase. / perakine reductase.
Best-hit-rice-name	LOC_Os04g26910
Best-hit-rice-defline	(1 of 8) 1.1.1.317 - perakine reductase. / perakine reductase.
locus_clean	BdiBd21-3.3G0639132
transcript_clean	BdiBd21-3.3G0639132.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.3G0687100.v1.2
gene_name	NA
seqname	Bd3
strand	-
start	52833732
end	52835290
gene_length_bp	1559
n_transcripts	1
feature_counts	exon: 1; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0687100.v1.2	NA	BdiBd21-3.3G0687100.1.v1.2	exon	phytozomev13	NA	NA	Bd3	52833732	52835290	-	1559
BdiBd21-3.3G0687100.v1.2	NA	BdiBd21-3.3G0687100.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	52833732	52835290	-	1559

field	value
#pacId	PAC:42981708
locusName	BdiBd21-3.3G0687100
transcriptName	BdiBd21-3.3G0687100.1
peptideName	BdiBd21-3.3G0687100.1.p
Pfam	PF00685
Panther	PTHR11783:SF79
ec	KOG1584
KOG	EC:2.8.2.25
KO	NA
GO	GO:0008146
Best-hit-arabi-name	AT5G07010
Best-hit-arabi-defline	(1 of 2) 2.8.2.39 - hydroxyjasmonate sulfotransferase. / hydroxyjasmonate sulfotransferase.
Best-hit-clamy-name	Cre09.g401960
Best-hit-clamy-defline	(1 of 1) 2.8.2.1 - aryl sulfotransferase. / sulfokinase.
Best-hit-rice-name	LOC_Os02g45890
Best-hit-rice-defline	(1 of 6) 2.8.2.39 - hydroxyjasmonate sulfotransferase. / hydroxyjasmonate sulfotransferase.
locus_clean	BdiBd21-3.3G0687100
transcript_clean	BdiBd21-3.3G0687100.1

field	value
locusName	BdiBd21-3.3G0687100
transcriptName	BdiBd21-3.3G0687100.1
peptideName	BdiBd21-3.3G0687100.1.p
go_id	GO:0008146
TERM	sulfotransferase activity
ONTOLOGY	MF
DEFINITION	Catalysis of the transfer of a sulfate group from 3’-phosphoadenosine 5’-phosphosulfate to the hydroxyl group of an acceptor, producing the sulfated derivative and 3’-phosphoadenosine 5’-phosphate.

key	value
gene_id	BdiBd21-3.3G0774700.v1.2
gene_name	NA
seqname	Bd3
strand	+
start	58186463
end	58188048
gene_length_bp	1586
n_transcripts	1
feature_counts	exon: 3; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0774700.v1.2	NA	BdiBd21-3.3G0774700.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58186463	58186699	+	237
BdiBd21-3.3G0774700.v1.2	NA	BdiBd21-3.3G0774700.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58186807	58186936	+	130
BdiBd21-3.3G0774700.v1.2	NA	BdiBd21-3.3G0774700.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58187059	58188048	+	990
BdiBd21-3.3G0774700.v1.2	NA	BdiBd21-3.3G0774700.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	58186463	58188048	+	1586

field	value
#pacId	PAC:42986289
locusName	BdiBd21-3.3G0774700
transcriptName	BdiBd21-3.3G0774700.1
peptideName	BdiBd21-3.3G0774700.1.p
Pfam	PF00249
Panther	PTHR10641:SF1335
ec	NA
KOG	NA
KO	K09422
GO	NA
Best-hit-arabi-name	AT1G34670
Best-hit-arabi-defline	(1 of 1) PTHR10641:SF1287 - TRANSCRIPTION FACTOR MYB93
Best-hit-clamy-name	Cre16.g677382
Best-hit-clamy-defline	(1 of 1) PTHR47999:SF143 - TRANSCRIPTION FACTOR MYB7
Best-hit-rice-name	LOC_Os06g11780
Best-hit-rice-defline	(1 of 2) PTHR10641:SF1381 - TRANSCRIPTION FACTOR MYB92
locus_clean	BdiBd21-3.3G0774700
transcript_clean	BdiBd21-3.3G0774700.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.3G0782100.v1.2
gene_name	NA
seqname	Bd3
strand	-
start	58613855
end	58617774
gene_length_bp	3920
n_transcripts	1
feature_counts	exon: 5; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0782100.v1.2	NA	BdiBd21-3.3G0782100.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58613855	58614563	-	709
BdiBd21-3.3G0782100.v1.2	NA	BdiBd21-3.3G0782100.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58615150	58615211	-	62
BdiBd21-3.3G0782100.v1.2	NA	BdiBd21-3.3G0782100.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58615321	58615515	-	195
BdiBd21-3.3G0782100.v1.2	NA	BdiBd21-3.3G0782100.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58617120	58617344	-	225
BdiBd21-3.3G0782100.v1.2	NA	BdiBd21-3.3G0782100.1.v1.2	exon	phytozomev13	NA	NA	Bd3	58617465	58617774	-	310
BdiBd21-3.3G0782100.v1.2	NA	BdiBd21-3.3G0782100.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	58613855	58617774	-	3920

field	value
#pacId	PAC:42986202
locusName	BdiBd21-3.3G0782100
transcriptName	BdiBd21-3.3G0782100.1
peptideName	BdiBd21-3.3G0782100.1.p
Pfam	PF00230
Panther	PTHR45724:SF16
ec	KOG0223
KOG	NA
KO	K09874
GO	GO:0015267 GO:0016020 GO:0055085
Best-hit-arabi-name	AT5G37820
Best-hit-arabi-defline	(1 of 1) PTHR45724:SF59 - AQUAPORIN NIP4-2-RELATED
Best-hit-clamy-name	Cre12.g549300
Best-hit-clamy-defline	(1 of 1) PTHR19139:SF199 - AQUAPORIN
Best-hit-rice-name	LOC_Os02g51110
Best-hit-rice-defline	(1 of 1) PTHR45724:SF16 - AQUAPORIN NIP2-1
locus_clean	BdiBd21-3.3G0782100
transcript_clean	BdiBd21-3.3G0782100.1

field	value
locusName	BdiBd21-3.3G0782100
transcriptName	BdiBd21-3.3G0782100.1
peptideName	BdiBd21-3.3G0782100.1.p
go_id	GO:0015267; GO:0016020; GO:0055085
TERM	channel activity; membrane; transmembrane transport
ONTOLOGY	MF; CC; BP
DEFINITION	Enables the energy-independent facilitated diffusion of a solute through a transmembrane aqueous pore or channel. Stereospecificity is not exhibited but this transport may be specific for a particular molecular species or class of molecules.; A lipid bilayer along with all the proteins and protein complexes embedded in it and attached to it.; The process in which a solute is transported across a lipid bilayer, from one side of a membrane to the other.

key	value
gene_id	BdiBd21-3.3G0792700.v1.2
gene_name	NA
seqname	Bd3
strand	+
start	59261533
end	59264181
gene_length_bp	2649
n_transcripts	1
feature_counts	exon: 3; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.3G0792700.v1.2	NA	BdiBd21-3.3G0792700.1.v1.2	exon	phytozomev13	NA	NA	Bd3	59261533	59261932	+	400
BdiBd21-3.3G0792700.v1.2	NA	BdiBd21-3.3G0792700.1.v1.2	exon	phytozomev13	NA	NA	Bd3	59262956	59263085	+	130
BdiBd21-3.3G0792700.v1.2	NA	BdiBd21-3.3G0792700.1.v1.2	exon	phytozomev13	NA	NA	Bd3	59263205	59264181	+	977
BdiBd21-3.3G0792700.v1.2	NA	BdiBd21-3.3G0792700.1.v1.2	transcript	phytozomev13	NA	NA	Bd3	59261533	59264181	+	2649

field	value
#pacId	PAC:42981452
locusName	BdiBd21-3.3G0792700
transcriptName	BdiBd21-3.3G0792700.1
peptideName	BdiBd21-3.3G0792700.1.p
Pfam	PF00249
Panther	PTHR48000:SF57
ec	NA
KOG	NA
KO	K09422
GO	NA
Best-hit-arabi-name	AT5G57620
Best-hit-arabi-defline	(1 of 1) PTHR48000:SF21 - TRANSCRIPTION FACTOR MYB36
Best-hit-clamy-name	Cre16.g677382
Best-hit-clamy-defline	(1 of 1) PTHR47999:SF143 - TRANSCRIPTION FACTOR MYB7
Best-hit-rice-name	LOC_Os02g54520
Best-hit-rice-defline	(1 of 1) PTHR48000:SF57 - OS02G0786400 PROTEIN
locus_clean	BdiBd21-3.3G0792700
transcript_clean	BdiBd21-3.3G0792700.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.4G0260700.v1.2
gene_name	NA
seqname	Bd4
strand	+
start	20067098
end	20069128
gene_length_bp	2031
n_transcripts	1
feature_counts	exon: 5; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.4G0260700.v1.2	NA	BdiBd21-3.4G0260700.1.v1.2	exon	phytozomev13	NA	NA	Bd4	20067098	20067580	+	483
BdiBd21-3.4G0260700.v1.2	NA	BdiBd21-3.4G0260700.1.v1.2	exon	phytozomev13	NA	NA	Bd4	20067656	20067868	+	213
BdiBd21-3.4G0260700.v1.2	NA	BdiBd21-3.4G0260700.1.v1.2	exon	phytozomev13	NA	NA	Bd4	20067955	20068103	+	149
BdiBd21-3.4G0260700.v1.2	NA	BdiBd21-3.4G0260700.1.v1.2	exon	phytozomev13	NA	NA	Bd4	20068203	20068476	+	274
BdiBd21-3.4G0260700.v1.2	NA	BdiBd21-3.4G0260700.1.v1.2	exon	phytozomev13	NA	NA	Bd4	20068550	20069128	+	579
BdiBd21-3.4G0260700.v1.2	NA	BdiBd21-3.4G0260700.1.v1.2	transcript	phytozomev13	NA	NA	Bd4	20067098	20069128	+	2031

X.pacId	locusName	transcriptName	peptideName	Pfam	Panther	ec	KOG	KO	GO	Best.hit.arabi.name	Best.hit.arabi.defline	Best.hit.clamy.name	Best.hit.clamy.defline	Best.hit.rice.name	Best.hit.rice.defline	locus_clean	transcript_clean
PAC:42947929	BdiBd21-3.4G0260700	BdiBd21-3.4G0260700.1	BdiBd21-3.4G0260700.1.p	PF00657	PTHR22835:SF677	NA	EC:2.3.1.98	NA	GO:0016788	AT1G28640	(1 of 4) PTHR22835:SF522 - SINAPINE ESTERASE	NA	NA	LOC_Os11g31940	(1 of 1) PTHR22835:SF677 - GDSL-LIKE LIPASE_ACYLHYDROLASE FAMILY PROTEIN, EXPRESSED	BdiBd21-3.4G0260700	BdiBd21-3.4G0260700.1

gene_summary\(jgi\)go_kv

key	value
gene_id	BdiBd21-3.4G0506300.v1.2
gene_name	NA
seqname	Bd4
strand	+
start	41793635
end	41795759
gene_length_bp	2125
n_transcripts	1
feature_counts	exon: 1; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.4G0506300.v1.2	NA	BdiBd21-3.4G0506300.1.v1.2	exon	phytozomev13	NA	NA	Bd4	41793635	41795759	+	2125
BdiBd21-3.4G0506300.v1.2	NA	BdiBd21-3.4G0506300.1.v1.2	transcript	phytozomev13	NA	NA	Bd4	41793635	41795759	+	2125

field	value
#pacId	PAC:42941674
locusName	BdiBd21-3.4G0506300
transcriptName	BdiBd21-3.4G0506300.1
peptideName	BdiBd21-3.4G0506300.1.p
Pfam	NA
Panther	PTHR36481:SF1
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	NA
Best-hit-arabi-defline	NA
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os09g36490
Best-hit-rice-defline	(1 of 136) IPR036426 - Bulb-type lectin domain superfamily
locus_clean	BdiBd21-3.4G0506300
transcript_clean	BdiBd21-3.4G0506300.1

table vide/incorrecte

key	value
gene_id	BdiBd21-3.5G0204500.v1.2
gene_name	NA
seqname	Bd5
strand	+
start	19403060
end	19404346
gene_length_bp	1287
n_transcripts	1
feature_counts	exon: 3; transcript: 1

gene_id	gene_name	transcript_id	type	source	score	phase	seqname	start	end	strand	width
BdiBd21-3.5G0204500.v1.2	NA	BdiBd21-3.5G0204500.1.v1.2	exon	phytozomev13	NA	NA	Bd5	19403060	19403488	+	429
BdiBd21-3.5G0204500.v1.2	NA	BdiBd21-3.5G0204500.1.v1.2	exon	phytozomev13	NA	NA	Bd5	19403572	19403695	+	124
BdiBd21-3.5G0204500.v1.2	NA	BdiBd21-3.5G0204500.1.v1.2	exon	phytozomev13	NA	NA	Bd5	19403800	19404346	+	547
BdiBd21-3.5G0204500.v1.2	NA	BdiBd21-3.5G0204500.1.v1.2	transcript	phytozomev13	NA	NA	Bd5	19403060	19404346	+	1287

field	value
#pacId	PAC:42952824
locusName	BdiBd21-3.5G0204500
transcriptName	BdiBd21-3.5G0204500.1
peptideName	BdiBd21-3.5G0204500.1.p
Pfam	PF04535
Panther	PTHR36488:SF8
ec	NA
KOG	NA
KO	NA
GO	NA
Best-hit-arabi-name	AT3G11550
Best-hit-arabi-defline	(1 of 13) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
Best-hit-clamy-name	NA
Best-hit-clamy-defline	NA
Best-hit-rice-name	LOC_Os04g58760
Best-hit-rice-defline	(1 of 11) PTHR36488:SF8 - CASP-LIKE PROTEIN 1U1
locus_clean	BdiBd21-3.5G0204500
transcript_clean	BdiBd21-3.5G0204500.1

table vide/incorrecte

These plots show in which clusters the candidate pericycle marker BdiBd21-3.4G0260700 is most strongly expressed (barplot), how its expression is distributed within each cluster (violin), and how its average expression varies jointly with cluster identity and timepoint (heatmap). The mean-expression barplot highlights the cluster where BdiBd21-3.5G0204500 is most enriched, the violin plot shows how specific this enrichment is compared to other clusters, and the UMAP views reveal where these expressing cells sit in the global embedding and across timepoints. The associated markers_gene2 table (especially the p_val_adj column) indicates whether this enrichment is statistically significant.