## ----include = FALSE----------------------------------------------------------
knitr::opts_chunk$set(
  collapse = TRUE,
  comment = "#>",
  eval = FALSE
)

## ----setup--------------------------------------------------------------------
# library(unitcm)

## ----search-basic-------------------------------------------------------------
# # Free-text search across all fields
# hits <- search_target2np(search = "quercetin")
# hits
# 
# # Exact-match by gene symbol
# tp53 <- search_target2np(
#   search = "TP53",
#   search_field = "gene_symbol",
#   search_mode = "exact"
# )
# tp53
# attr(tp53, "total")

## ----search-filters-----------------------------------------------------------
# # Combine filters
# results <- search_target2np(
#   search = "curcumin",
#   search_field = "compound_name",
#   source_db = "BindingDB",
#   target_organism = "Homo sapiens",
#   activity_type = "IC50"
# )
# results

## ----filter-options-----------------------------------------------------------
# # What filter values exist?
# opts <- fetch_target2np_filters()
# opts$source_db
# opts$target_organism
# opts$activity_type
# 
# # Global database statistics
# stats <- fetch_target2np_stats()
# stats$total_records
# stats$source_db_distribution

## ----detail-------------------------------------------------------------------
# detail <- get_target2np(1)
# detail$compound_name
# detail$gene_symbol
# detail$activity_value
# detail$activity_units
# detail$pmid

## ----batch--------------------------------------------------------------------
# batch <- batch_target2np(c("TP53", "BRCA1", "EGFR", "VEGFA"))
# batch
# attr(batch, "queries_matched")
# attr(batch, "queries_not_found")
# 
# # UniProt-based batch
# batch_up <- batch_target2np(
#   c("P04637", "P38398"),
#   id_type = "uniprot_id"
# )

## ----drugclip-----------------------------------------------------------------
# # High-confidence predictions for quercetin
# dc_high <- search_target2np_drugclip(
#   search = "quercetin",
#   search_field = "compound_name",
#   confidence = "high"
# )
# dc_high
# 
# # Score-based filtering
# dc <- search_target2np_drugclip(
#   search = "EGFR",
#   search_field = "gene_symbol",
#   min_score = 0.7
# )
# dc

## ----sea----------------------------------------------------------------------
# # High-confidence SEA predictions
# sea_high <- search_target2np_sea(
#   search = "quercetin",
#   search_field = "compound_name",
#   confidence = "high"
# )
# sea_high
# 
# # Filter by adjusted p-value
# sea <- search_target2np_sea(
#   search = "TP53",
#   search_field = "gene_symbol",
#   max_pvalue = 0.01
# )
# sea

## ----multi-source-------------------------------------------------------------
# summary <- target2np_multi_source_summary(
#   search = "TP53",
#   search_field = "gene_symbol"
# )
# 
# # How many results per source?
# summary$source_counts
# 
# # Target overlap across data sources
# summary$target_overlap
# 
# # Confidence-level distribution for each source
# summary$confidence_distribution
# 
# # Compound-target pairs found in >= 2 sources
# summary$cross_validated
# 
# # Natural-language interpretation
# cat(summary$suggestion_text)

## ----aggregated---------------------------------------------------------------
# # Pairs seen in >= 3 databases
# agg <- aggregated_target2np(
#   search = "quercetin",
#   min_sources = 3
# )
# agg
# 
# # Include DrugCLIP/SEA prediction counts as additional sources
# agg_pred <- aggregated_target2np(
#   search = "quercetin",
#   min_sources = 2,
#   include_predictions = TRUE
# )
# agg_pred

## ----workflow-----------------------------------------------------------------
# # 1. Check experimental evidence
# exp <- search_target2np(
#   search = "quercetin",
#   search_field = "compound_name",
#   search_mode = "fuzzy",
#   all_pages = TRUE
# )
# nrow(exp)
# 
# # 2. Get multi-source summary in one call
# ms <- target2np_multi_source_summary(
#   search = "quercetin",
#   search_field = "compound_name",
#   search_mode = "fuzzy"
# )
# ms$source_counts
# ms$cross_validated
# 
# # 3. Batch-check the top cross-validated targets
# top_genes <- unique(vapply(
#   ms$cross_validated, `[[`, character(1), "gene_symbol"
# ))
# if (length(top_genes) > 0) {
#   batch_detail <- batch_target2np(top_genes)
#   batch_detail
# }